From fd2a77678d433c0f23e3495f0d16fb16d29a4044 Mon Sep 17 00:00:00 2001 From: Connor Shorten Date: Fri, 21 Feb 2025 11:59:41 -0500 Subject: [PATCH] rerun benchmark with fixes --- src/docker-compose.yml | 2 +- src/lm/lm.py | 7 + src/models.py | 15 +- src/optimizers/setup_database.py | 2 +- src/test_gorilla/gpt-4o-02-21-25.json | 46885 ++++++++++++++++ src/test_gorilla/gpt-4o-mini-02-21-25.json | 46310 ++++++++++++++++ src/test_gorilla/grok-2-latest-02-21-25.json | 47008 +++++++++++++++++ src/test_gorilla/main_test.py | 73 +- src/utils/weaviate_fc_utils.py | 30 +- 9 files changed, 140293 insertions(+), 39 deletions(-) create mode 100644 src/test_gorilla/gpt-4o-02-21-25.json create mode 100644 src/test_gorilla/gpt-4o-mini-02-21-25.json create mode 100644 src/test_gorilla/grok-2-latest-02-21-25.json diff --git a/src/docker-compose.yml b/src/docker-compose.yml index 2bd13ad..7143811 100644 --- a/src/docker-compose.yml +++ b/src/docker-compose.yml @@ -20,7 +20,7 @@ services: AUTHENTICATION_ANONYMOUS_ACCESS_ENABLED: 'true' PERSISTENCE_DATA_PATH: '/var/lib/weaviate' DEFAULT_VECTORIZER_MODULE: 'text2vec-openai' - OPENAI_API_KEY: '' + OPENAI_API_KEY: 'YOUR_OPENAI_API_KEY' ENABLE_MODULES: 'text2vec-openai' ENABLE_API_BASED_MODULES: 'true' CLUSTER_HOSTNAME: 'node1' diff --git a/src/lm/lm.py b/src/lm/lm.py index 03b144b..dd95b7a 100644 --- a/src/lm/lm.py +++ b/src/lm/lm.py @@ -21,6 +21,7 @@ # google models are accessed through the openai SDK with a check on `model_name` # together models are accessed through the openai SDK with a different base URL +# grok models are accessed through the openai SDK with a different base URL LMModelProvider = Literal["ollama", "openai", "anthropic", "cohere", "together"] # need to add models to this...! @@ -45,6 +46,12 @@ def __init__( api_key=api_key, base_url="https://generativelanguage.googleapis.com/v1beta/" ) + elif self.model_name.startswith("grok-"): + print("\033[96mUsing Grok through the OpenAI SDK.\033[0m") + self.lm_client = openai.OpenAI( + api_key=api_key, + base_url="https://api.x.ai/v1" + ) else: self.lm_client = openai.OpenAI( api_key=api_key diff --git a/src/models.py b/src/models.py index cbef6aa..5b4a28c 100644 --- a/src/models.py +++ b/src/models.py @@ -125,18 +125,6 @@ class SyntheticFilterQueries(BaseModel): boolean_property_filter_query: BooleanPropertyFilterWithQuery class WeaviateQuery(BaseModel): - corresponding_natural_language_query: str - target_collection: str - search_query: Optional[str] - integer_property_filter: Optional[IntPropertyFilter] - text_property_filter: Optional[TextPropertyFilter] - boolean_property_filter: Optional[BooleanPropertyFilter] - integer_property_aggregation: Optional[IntAggregation] - text_property_aggregation: Optional[TextAggregation] - boolean_property_aggregation: Optional[BooleanAggregation] - groupby_property: Optional[str] - -class NewWeaviateQuery(BaseModel): corresponding_natural_language_query: Optional[str] = None target_collection: str search_query: Optional[str] = None @@ -371,5 +359,4 @@ class TogetherAIFunction(BaseModel): class TogetherAITool(BaseModel): type: Literal["function"] - function: TogetherAIFunction - + function: TogetherAIFunction \ No newline at end of file diff --git a/src/optimizers/setup_database.py b/src/optimizers/setup_database.py index 5fb8029..025491a 100644 --- a/src/optimizers/setup_database.py +++ b/src/optimizers/setup_database.py @@ -7,7 +7,7 @@ # Connect to Weaviate and populate datasets client = weaviate.connect_to_local( headers={ - "X-OpenAI-Api-Key": "" + "X-OpenAI-Api-Key": os.getenv("OPENAI_API_KEY") } ) WEAVIATE_URL = "http://localhost:8080/v1/schema" diff --git a/src/test_gorilla/gpt-4o-02-21-25.json b/src/test_gorilla/gpt-4o-02-21-25.json new file mode 100644 index 0000000..2bd8d06 --- /dev/null +++ b/src/test_gorilla/gpt-4o-02-21-25.json @@ -0,0 +1,46885 @@ +{ + "timestamp": "2025-02-21T11:57:05.869365", + "model_name": "gpt-4o", + "generate_with_models": false, + "total_queries": 315, + "successful_predictions": 308, + "failed_predictions": 7, + "average_ast_score": 0.8228084415584404, + "perfect_matches": 190, + "per_schema_scores": { + "0": 0.8632812500000002, + "1": 0.9332031250000004, + "2": 0.9015625000000004, + "3": 0.41953125000000013 + }, + "detailed_results": [ + { + "query_index": 0, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine, where the average rating is at least 4, count how many such restaurants there are, and group them by whether they are currently open or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine, where the average rating is at least 4, count how many such restaurants there are, and group them by whether they are currently open or not.", + "target_collection": "Restaurants", + "search_query": "Find restaurants with a cozy ambiance and Italian cuisine", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine, where the average rating is at least 4, count how many such restaurants there are, and group them by whether they are currently open or not.", + "target_collection": "Restaurants", + "search_query": "cozy ambiance and Italian cuisine", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 1, + "database_schema_index": 0, + "natural_language_query": "Find Italian cuisine restaurants with a cozy ambiance that have an average rating of at least 4, plus provide the count of such restaurants that are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find Italian cuisine restaurants with a cozy ambiance that have an average rating of at least 4, plus provide the count of such restaurants that are currently open.", + "target_collection": "Restaurants", + "search_query": "Find restaurants with cozy ambiance and Italian cuisine", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find Italian cuisine restaurants with a cozy ambiance that have an average rating of at least 4, plus provide the count of such restaurants that are currently open.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine restaurants with a cozy ambiance", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 2, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that match the description 'authentic Italian ambiance', have an averageRating greater than 4, list the top 5 most common restaurant names in this set, and partition the results based on whether the restaurant is currently open or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that match the description 'authentic Italian ambiance', have an averageRating greater than 4, list the top 5 most common restaurant names in this set, and partition the results based on whether the restaurant is currently open or not.", + "target_collection": "Restaurants", + "search_query": "authentic Italian ambiance", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that match the description 'authentic Italian ambiance', have an averageRating greater than 4, list the top 5 most common restaurant names in this set, and partition the results based on whether the restaurant is currently open or not.", + "target_collection": "Restaurants", + "search_query": "authentic Italian ambiance", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "restaurantName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 3, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a family-friendly ambiance and Italian cuisine rated with at least 4.5 in averageRating, and identify the top 3 most common descriptions.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a family-friendly ambiance and Italian cuisine rated with at least 4.5 in averageRating, and identify the top 3 most common descriptions.", + "target_collection": "Restaurants", + "search_query": "Find restaurants with a family-friendly ambiance and Italian cuisine", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with a family-friendly ambiance and Italian cuisine rated with at least 4.5 in averageRating, and identify the top 3 most common descriptions.", + "target_collection": "Restaurants", + "search_query": "family-friendly ambiance Italian cuisine", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 4, + "database_schema_index": 0, + "natural_language_query": "Find restaurants offering Italian cuisine with a cozy atmosphere, with at least an average rating of 4.5. Also, calculate the percentage of these restaurants that are open and group results based on their open status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants offering Italian cuisine with a cozy atmosphere, with at least an average rating of 4.5. Also, calculate the percentage of these restaurants that are open and group results based on their open status.", + "target_collection": "Restaurants", + "search_query": "Find restaurants offering Italian cuisine with a cozy atmosphere", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants offering Italian cuisine with a cozy atmosphere, with at least an average rating of 4.5. Also, calculate the percentage of these restaurants that are open and group results based on their open status.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine with a cozy atmosphere", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 5, + "database_schema_index": 0, + "natural_language_query": "Find Italian cuisine restaurants with descriptions containing 'Italian cuisine', with averageRating greater than 4.0, and calculate the percentage of these that are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find Italian cuisine restaurants with descriptions containing 'Italian cuisine', with averageRating greater than 4.0, and calculate the percentage of these that are currently open.", + "target_collection": "Restaurants", + "search_query": "Search for restaurants with descriptions containing 'Italian cuisine'", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find Italian cuisine restaurants with descriptions containing 'Italian cuisine', with averageRating greater than 4.0, and calculate the percentage of these that are currently open.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "description.cuisine", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 6, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that are similar to Italian family-friendly places, have an averageRating of at least 4, and group them by whether they are currently open (openNow).", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that are similar to Italian family-friendly places, have an averageRating of at least 4, and group them by whether they are currently open (openNow).", + "target_collection": "Restaurants", + "search_query": "Italian, family-friendly ambiance", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that are similar to Italian family-friendly places, have an averageRating of at least 4, and group them by whether they are currently open (openNow).", + "target_collection": "Restaurants", + "search_query": "Italian family-friendly places", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 7, + "database_schema_index": 0, + "natural_language_query": "Find Italian restaurants with a cozy ambiance, and the averageRating must be greater than 4.0.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find Italian restaurants with a cozy ambiance, and the averageRating must be greater than 4.0.", + "target_collection": "Restaurants", + "search_query": "Looking for Italian restaurants with a cozy ambiance", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find Italian restaurants with a cozy ambiance, and the averageRating must be greater than 4.0.", + "target_collection": "Restaurants", + "search_query": "Italian restaurants with a cozy ambiance", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 8, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with an Italian ambiance and explicitly mentioned as family friendly in their description, calculate the average of each restaurant's averageRating, and group the results by restaurant name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with an Italian ambiance and explicitly mentioned as family friendly in their description, calculate the average of each restaurant's averageRating, and group the results by restaurant name.", + "target_collection": "Restaurants", + "search_query": "Italian ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "family friendly" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with an Italian ambiance and explicitly mentioned as family friendly in their description, calculate the average of each restaurant's averageRating, and group the results by restaurant name.", + "target_collection": "Restaurants", + "search_query": "Italian ambiance family friendly", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 9, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that have a romantic ambiance using search query, filter the results to include only those where the name contains 'Ristorante', and count the number of these restaurants using the averageRating property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that have a romantic ambiance using search query, filter the results to include only those where the name contains 'Ristorante', and count the number of these restaurants using the averageRating property.", + "target_collection": "Restaurants", + "search_query": "romantic ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "Ristorante" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that have a romantic ambiance using search query, filter the results to include only those where the name contains 'Ristorante', and count the number of these restaurants using the averageRating property.", + "target_collection": "Restaurants", + "search_query": "romantic ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "%Ristorante%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 10, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a cozy and modern ambiance that mention 'casual dining' in their description. Count the number of unique restaurant names and group the results by whether they are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a cozy and modern ambiance that mention 'casual dining' in their description. Count the number of unique restaurant names and group the results by whether they are currently open.", + "target_collection": "Restaurants", + "search_query": "Cozy and modern ambiance with festive atmosphere", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%casual dining%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with a cozy and modern ambiance that mention 'casual dining' in their description. Count the number of unique restaurant names and group the results by whether they are currently open.", + "target_collection": "Restaurants", + "search_query": "cozy and modern ambiance casual dining", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 11, + "database_schema_index": 0, + "natural_language_query": "Search for restaurants similar in description and ambiance to those fitting the concept of cozy and modern cuisine, filter to only include restaurants named exactly 'Ocean View Grille', and count the occurrences of each restaurant name in the results.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Search for restaurants similar in description and ambiance to those fitting the concept of cozy and modern cuisine, filter to only include restaurants named exactly 'Ocean View Grille', and count the occurrences of each restaurant name in the results.", + "target_collection": "Restaurants", + "search_query": "Find the most relevant restaurants based on their description of the cuisine and ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Ocean View Grille" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for restaurants similar in description and ambiance to those fitting the concept of cozy and modern cuisine, filter to only include restaurants named exactly 'Ocean View Grille', and count the occurrences of each restaurant name in the results.", + "target_collection": "Restaurants", + "search_query": "cozy modern cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Ocean View Grille" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 12, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a nature ambiance, having Italian cuisine in their description, calculate the percentage of restaurants currently open, and group them by their average rating to summarize.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a nature ambiance, having Italian cuisine in their description, calculate the percentage of restaurants currently open, and group them by their average rating to summarize.", + "target_collection": "Restaurants", + "search_query": "nature ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with a nature ambiance, having Italian cuisine in their description, calculate the percentage of restaurants currently open, and group them by their average rating to summarize.", + "target_collection": "Restaurants", + "search_query": "nature ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 13, + "database_schema_index": 0, + "natural_language_query": "Find restaurants similar to a cozy Italian restaurant with a great wine selection, include only those whose name contains 'Grill', and count how many of them are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants similar to a cozy Italian restaurant with a great wine selection, include only those whose name contains 'Grill', and count how many of them are currently open.", + "target_collection": "Restaurants", + "search_query": "A cozy Italian restaurant with a great wine selection", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "Grill" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants similar to a cozy Italian restaurant with a great wine selection, include only those whose name contains 'Grill', and count how many of them are currently open.", + "target_collection": "Restaurants", + "search_query": "cozy Italian restaurant with a great wine selection", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "%Grill%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 14, + "database_schema_index": 0, + "natural_language_query": "Find restaurants offering authentic Italian cuisine while they are open now, and group these restaurants by their average rating.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants offering authentic Italian cuisine while they are open now, and group these restaurants by their average rating.", + "target_collection": "Restaurants", + "search_query": "authentic Italian cuisine", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants offering authentic Italian cuisine while they are open now, and group these restaurants by their average rating.", + "target_collection": "Restaurants", + "search_query": "authentic Italian cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 15, + "database_schema_index": 0, + "natural_language_query": "Search for restaurants that are famous for Italian cuisine using semantic search for 'cuisine' and 'ambiance', and additionally filter to show only those whose description explicitly contains the word 'romantic'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Search for restaurants that are famous for Italian cuisine using semantic search for 'cuisine' and 'ambiance', and additionally filter to show only those whose description explicitly contains the word 'romantic'.", + "target_collection": "Restaurants", + "search_query": "Find restaurants known for Italian cuisine with a romantic ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "romantic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for restaurants that are famous for Italian cuisine using semantic search for 'cuisine' and 'ambiance', and additionally filter to show only those whose description explicitly contains the word 'romantic'.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "romantic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 16, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that offer a romantic ambiance and Italian cuisine, ensure they are open now, calculate the average rating, and organize the results by each restaurant's name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that offer a romantic ambiance and Italian cuisine, ensure they are open now, calculate the average rating, and organize the results by each restaurant's name.", + "target_collection": "Restaurants", + "search_query": "Find restaurants that offer a romantic ambiance and Italian cuisine", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that offer a romantic ambiance and Italian cuisine, ensure they are open now, calculate the average rating, and organize the results by each restaurant's name.", + "target_collection": "Restaurants", + "search_query": "romantic ambiance Italian", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 17, + "database_schema_index": 0, + "natural_language_query": "Find cozy Italian restaurants with a great wine selection that are open now, and calculate the average rating of these open restaurants.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find cozy Italian restaurants with a great wine selection that are open now, and calculate the average rating of these open restaurants.", + "target_collection": "Restaurants", + "search_query": "Looking for cozy Italian restaurants with a great wine selection", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find cozy Italian restaurants with a great wine selection that are open now, and calculate the average rating of these open restaurants.", + "target_collection": "Restaurants", + "search_query": "cozy Italian restaurants with a great wine selection", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 18, + "database_schema_index": 0, + "natural_language_query": "What are the romantic Italian restaurants that are currently open now, and what is the most common description among them, grouped by their name?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What are the romantic Italian restaurants that are currently open now, and what is the most common description among them, grouped by their name?", + "target_collection": "Restaurants", + "search_query": "Find restaurants matching 'romantic Italian dining'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the romantic Italian restaurants that are currently open now, and what is the most common description among them, grouped by their name?", + "target_collection": "Restaurants", + "search_query": "romantic Italian restaurants", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 19, + "database_schema_index": 0, + "natural_language_query": "Find restaurants offering Mediterranean cuisine with a cozy ambiance and are currently open, then list the top 5 most common restaurant names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants offering Mediterranean cuisine with a cozy ambiance and are currently open, then list the top 5 most common restaurant names.", + "target_collection": "Restaurants", + "search_query": "Explore Mediterranean cuisine with a cozy ambiance", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants offering Mediterranean cuisine with a cozy ambiance and are currently open, then list the top 5 most common restaurant names.", + "target_collection": "Restaurants", + "search_query": "Mediterranean cuisine with a cozy ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 20, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that are known for their cozy ambiance and Italian cuisine, filter those that are currently open, aggregate to count how many are open versus closed, and organize results by the name of the restaurant.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that are known for their cozy ambiance and Italian cuisine, filter those that are currently open, aggregate to count how many are open versus closed, and organize results by the name of the restaurant.", + "target_collection": "Restaurants", + "search_query": "Find restaurants that are known for their cozy ambiance and Italian cuisine.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that are known for their cozy ambiance and Italian cuisine, filter those that are currently open, aggregate to count how many are open versus closed, and organize results by the name of the restaurant.", + "target_collection": "Restaurants", + "search_query": "cozy ambiance Italian cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 21, + "database_schema_index": 0, + "natural_language_query": "Find restaurants serving Italian cuisine with a romantic ambiance that are currently open, and calculate the percentage of restaurants that are open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants serving Italian cuisine with a romantic ambiance that are currently open, and calculate the percentage of restaurants that are open.", + "target_collection": "Restaurants", + "search_query": "Find restaurants serving Italian cuisine with a romantic ambiance", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants serving Italian cuisine with a romantic ambiance that are currently open, and calculate the percentage of restaurants that are open.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine with a romantic ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 22, + "database_schema_index": 0, + "natural_language_query": "Find cozy Italian restaurants that are currently open, and group them by their name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find cozy Italian restaurants that are currently open, and group them by their name.", + "target_collection": "Restaurants", + "search_query": "Find cozy Italian restaurants", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find cozy Italian restaurants that are currently open, and group them by their name.", + "target_collection": "Restaurants", + "search_query": "cozy Italian restaurants", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 23, + "database_schema_index": 0, + "natural_language_query": "Find currently open restaurants that conceptually relate to 'Italian cuisine with a cozy ambiance.'", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find currently open restaurants that conceptually relate to 'Italian cuisine with a cozy ambiance.'", + "target_collection": "Restaurants", + "search_query": "Find restaurants serving Italian cuisine with a cozy ambiance", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find currently open restaurants that conceptually relate to 'Italian cuisine with a cozy ambiance.'", + "target_collection": "Restaurants", + "search_query": "Italian cuisine with a cozy ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 24, + "database_schema_index": 0, + "natural_language_query": "What are the total party sizes of reservations that mention 'birthday' in notes, grouped by whether the reservation is confirmed?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What are the total party sizes of reservations that mention 'birthday' in notes, grouped by whether the reservation is confirmed?", + "target_collection": "Reservations", + "search_query": "Find reservations where the notes mention 'birthday'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "confirmed" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the total party sizes of reservations that mention 'birthday' in notes, grouped by whether the reservation is confirmed?", + "target_collection": "Reservations", + "search_query": "birthday", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isConfirmed", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 25, + "database_schema_index": 0, + "natural_language_query": "What is the average price of spicy vegetarian menu items?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What is the average price of spicy vegetarian menu items?", + "target_collection": "Menus", + "search_query": "Find menu items with a description that matches 'spicy vegetarian options'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "price", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average price of spicy vegetarian menu items?", + "target_collection": "Menu_items", + "search_query": "spicy vegetarian", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "price", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 26, + "database_schema_index": 0, + "natural_language_query": "Identify romantic restaurants by analyzing descriptions for ambiance, count the number of unique restaurants, and group the results by whether they are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Identify romantic restaurants by analyzing descriptions for ambiance, count the number of unique restaurants, and group the results by whether they are currently open.", + "target_collection": "Restaurants", + "search_query": "Find restaurants that offer a romantic ambiance.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 27, + "database_schema_index": 0, + "natural_language_query": "Identify how many unique restaurants offer a cozy Italian cuisine with a romantic ambiance by analyzing their descriptions and count the occurrences of different restaurant names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Identify how many unique restaurants offer a cozy Italian cuisine with a romantic ambiance by analyzing their descriptions and count the occurrences of different restaurant names.", + "target_collection": "Restaurants", + "search_query": "Find restaurants with a description that matches 'cozy Italian cuisine with romantic ambiance'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify how many unique restaurants offer a cozy Italian cuisine with a romantic ambiance by analyzing their descriptions and count the occurrences of different restaurant names.", + "target_collection": "Restaurants", + "search_query": "cozy Italian cuisine with a romantic ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 28, + "database_schema_index": 0, + "natural_language_query": "What percentage of restaurants that offer outdoor seating and live music are currently open, and how are they distributed by their average rating?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What percentage of restaurants that offer outdoor seating and live music are currently open, and how are they distributed by their average rating?", + "target_collection": "Restaurants", + "search_query": "Find restaurants that offer outdoor seating and live music.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "What percentage of restaurants that offer outdoor seating and live music are currently open, and how are they distributed by their average rating?", + "target_collection": "Restaurants", + "search_query": "outdoor seating and live music", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 29, + "database_schema_index": 0, + "natural_language_query": "What percentage of confirmed reservations mention the word 'celebration' in the notes?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What percentage of confirmed reservations mention the word 'celebration' in the notes?", + "target_collection": "Reservations", + "search_query": "celebration", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "confirmed", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What percentage of confirmed reservations mention the word 'celebration' in the notes?", + "target_collection": "Reservations", + "search_query": "celebration", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "confirmed", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 30, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine in their description using search_query, and then group these restaurants by their averageRating.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine in their description using search_query, and then group these restaurants by their averageRating.", + "target_collection": "Restaurants", + "search_query": "restaurants with a cozy ambiance and Italian cuisine", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine in their description using search_query, and then group these restaurants by their averageRating.", + "target_collection": "Restaurants", + "search_query": "cozy ambiance Italian cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 31, + "database_schema_index": 0, + "natural_language_query": "Find restaurants described as having a cozy ambiance in their detailed description.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants described as having a cozy ambiance in their detailed description.", + "target_collection": "Restaurants", + "search_query": "{\"query\":\"Find restaurants with cozy ambiance.\"}", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants described as having a cozy ambiance in their detailed description.", + "target_collection": "Restaurants", + "search_query": "cozy ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 32, + "database_schema_index": 0, + "natural_language_query": "Find reservations where the partySize is greater than 4, group the results by reservationName, and calculate the average partySize for each reservationName group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find reservations where the partySize is greater than 4, group the results by reservationName, and calculate the average partySize for each reservationName group.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find reservations where the partySize is greater than 4, group the results by reservationName, and calculate the average partySize for each reservationName group.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 33, + "database_schema_index": 0, + "natural_language_query": "Find how many reservations have a partySize of at least 4 people and provide the total count.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find how many reservations have a partySize of at least 4 people and provide the total count.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find how many reservations have a partySize of at least 4 people and provide the total count.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 34, + "database_schema_index": 0, + "natural_language_query": "Show all reservations with a partySize of at least 5 people, count how many times each reservationName occurs, and group the results by whether the reservation is confirmed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Show all reservations with a partySize of at least 5 people, count how many times each reservationName occurs, and group the results by whether the reservation is confirmed.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "confirmed" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show all reservations with a partySize of at least 5 people, count how many times each reservationName occurs, and group the results by whether the reservation is confirmed.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "reservationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "confirmed", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 35, + "database_schema_index": 0, + "natural_language_query": "Find all menu items with a price less than $20 and determine the top 3 most common menuItem names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find all menu items with a price less than $20 and determine the top 3 most common menuItem names.", + "target_collection": "Menus", + "search_query": null, + "integer_property_filter": { + "property_name": "price", + "operator": "<", + "value": 20.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "menuItem", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all menu items with a price less than $20 and determine the top 3 most common menuItem names.", + "target_collection": "Menu_items", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "price", + "operator": "<", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "menuItem", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 36, + "database_schema_index": 0, + "natural_language_query": "Find reservations that have at least 5 people in partySize, aggregate them by counting the number of true values in the confirmed status, and group the results by reservationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find reservations that have at least 5 people in partySize, aggregate them by counting the number of true values in the confirmed status, and group the results by reservationName.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find reservations that have at least 5 people in partySize, aggregate them by counting the number of true values in the confirmed status, and group the results by reservationName.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "confirmed", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "reservationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 37, + "database_schema_index": 0, + "natural_language_query": "Find all reservations where there are more than 4 people in the partySize and count how many of these reservations are confirmed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find all reservations where there are more than 4 people in the partySize and count how many of these reservations are confirmed.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all reservations where there are more than 4 people in the partySize and count how many of these reservations are confirmed.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isConfirmed", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 38, + "database_schema_index": 0, + "natural_language_query": "Find reservations where the partySize is at least 4 and group the results by whether the reservation is confirmed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find reservations where the partySize is at least 4 and group the results by whether the reservation is confirmed.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "confirmed" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find reservations where the partySize is at least 4 and group the results by whether the reservation is confirmed.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isConfirmed", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 39, + "database_schema_index": 0, + "natural_language_query": "Find all reservations with a partySize that is at least 5", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find all reservations with a partySize that is at least 5", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all reservations with a partySize that is at least 5", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 40, + "database_schema_index": 0, + "natural_language_query": "Find Italian restaurants by filtering descriptions that contain the word 'Italian', then calculate the average rating of these restaurants, and group results by whether they are currently open now.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find Italian restaurants by filtering descriptions that contain the word 'Italian', then calculate the average rating of these restaurants, and group results by whether they are currently open now.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find Italian restaurants by filtering descriptions that contain the word 'Italian', then calculate the average rating of these restaurants, and group results by whether they are currently open now.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 41, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with the word 'vegan' in their description and count how many such restaurants exist.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with the word 'vegan' in their description and count how many such restaurants exist.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%vegan%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 42, + "database_schema_index": 0, + "natural_language_query": "Retrieve the count of restaurants containing 'Italian' in the description, group them by the openNow status, and provide the count of each restaurant name within those groups.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Retrieve the count of restaurants containing 'Italian' in the description, group them by the openNow status, and provide the count of each restaurant name within those groups.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%Italian%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve the count of restaurants containing 'Italian' in the description, group them by the openNow status, and provide the count of each restaurant name within those groups.", + "target_collection": "Restaurants", + "search_query": "Italian", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 43, + "database_schema_index": 0, + "natural_language_query": "Find menu items with descriptions containing the word 'spicy' and determine the top three most common item names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find menu items with descriptions containing the word 'spicy' and determine the top three most common item names.", + "target_collection": "Menus", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "itemDescription", + "operator": "LIKE", + "value": "spicy" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "menuItem", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find menu items with descriptions containing the word 'spicy' and determine the top three most common item names.", + "target_collection": "MenuItems", + "search_query": "spicy", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "itemName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 44, + "database_schema_index": 0, + "natural_language_query": "Find reservations that mention 'birthday' in their notes, count how many of these reservations are confirmed, and group the results by the name under which each reservation is made.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find reservations that mention 'birthday' in their notes, count how many of these reservations are confirmed, and group the results by the name under which each reservation is made.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "notes", + "operator": "LIKE", + "value": "%birthday%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find reservations that mention 'birthday' in their notes, count how many of these reservations are confirmed, and group the results by the name under which each reservation is made.", + "target_collection": "Reservations", + "search_query": "birthday", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "confirmed", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "reservationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 45, + "database_schema_index": 0, + "natural_language_query": "Find all restaurants that mention 'vegan' in their description and count how many are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find all restaurants that mention 'vegan' in their description and count how many are currently open.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "vegan" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all restaurants that mention 'vegan' in their description and count how many are currently open.", + "target_collection": "Restaurants", + "search_query": "vegan", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 46, + "database_schema_index": 0, + "natural_language_query": "Find restaurants where the description contains 'Italian cuisine' and group these results by their name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants where the description contains 'Italian cuisine' and group these results by their name.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian cuisine" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants where the description contains 'Italian cuisine' and group these results by their name.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 47, + "database_schema_index": 0, + "natural_language_query": "Find restaurants in the Restaurants collection where the description contains the keyword 'Italian'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants in the Restaurants collection where the description contains the keyword 'Italian'.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "No tool called" + }, + { + "query_index": 48, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that are currently open, group them by their averageRating, and calculate the mean averageRating for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that are currently open, group them by their averageRating, and calculate the mean averageRating for each group.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that are currently open, group them by their averageRating, and calculate the mean averageRating for each group.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 49, + "database_schema_index": 0, + "natural_language_query": "Determine the average rating of all restaurants that are open now, filtering by the openNow property, and calculate the mean on the averageRating property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Determine the average rating of all restaurants that are open now, filtering by the openNow property, and calculate the mean on the averageRating property.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Determine the average rating of all restaurants that are open now, filtering by the openNow property, and calculate the mean on the averageRating property.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 50, + "database_schema_index": 0, + "natural_language_query": "What types of cuisines are available in restaurants that are currently open, grouped by their average rating?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What types of cuisines are available in restaurants that are currently open, grouped by their average rating?", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "What types of cuisines are available in restaurants that are currently open, grouped by their average rating?", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description.cuisine", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 51, + "database_schema_index": 0, + "natural_language_query": "Identify the most common cuisine type among all restaurants that are currently open (using 'openNow' property for filtering and 'description' property for text aggregation).", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Identify the most common cuisine type among all restaurants that are currently open (using 'openNow' property for filtering and 'description' property for text aggregation).", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify the most common cuisine type among all restaurants that are currently open (using 'openNow' property for filtering and 'description' property for text aggregation).", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description.cuisine", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 52, + "database_schema_index": 0, + "natural_language_query": "Calculate the percentage of restaurants that are currently open (openNow = true), and group these open restaurants by their averageRating to understand how many are open in each rating category.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of restaurants that are currently open (openNow = true), and group these open restaurants by their averageRating to understand how many are open in each rating category.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of restaurants that are currently open (openNow = true), and group these open restaurants by their averageRating to understand how many are open in each rating category.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 53, + "database_schema_index": 0, + "natural_language_query": "Show me all confirmed reservations and count the total number of confirmed versus unconfirmed reservations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Show me all confirmed reservations and count the total number of confirmed versus unconfirmed reservations.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "confirmed", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Show me all confirmed reservations and count the total number of confirmed versus unconfirmed reservations.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "confirmed", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 54, + "database_schema_index": 0, + "natural_language_query": "Show all restaurants that are currently open (openNow = true), and group these by the type of cuisine mentioned in the description to see how many open restaurants exist for each cuisine type.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Show all restaurants that are currently open (openNow = true), and group these by the type of cuisine mentioned in the description to see how many open restaurants exist for each cuisine type.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show all restaurants that are currently open (openNow = true), and group these by the type of cuisine mentioned in the description to see how many open restaurants exist for each cuisine type.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description.cuisine", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 55, + "database_schema_index": 0, + "natural_language_query": "Find restaurants where openNow is true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants where openNow is true.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants where openNow is true.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 56, + "database_schema_index": 0, + "natural_language_query": "Find the total party size for reservations grouped by reservationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find the total party size for reservations grouped by reservationName.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the total party size for reservations grouped by reservationName.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 57, + "database_schema_index": 0, + "natural_language_query": "Count the number of reservations based on their partySize.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Count the number of reservations based on their partySize.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Count the number of reservations based on their partySize.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "partySize", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 58, + "database_schema_index": 0, + "natural_language_query": "Find the types of cuisines mentioned most frequently in the restaurant descriptions, grouped by whether the restaurants are currently open or closed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find the types of cuisines mentioned most frequently in the restaurant descriptions, grouped by whether the restaurants are currently open or closed.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the types of cuisines mentioned most frequently in the restaurant descriptions, grouped by whether the restaurants are currently open or closed.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description.cuisine", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 59, + "database_schema_index": 0, + "natural_language_query": "What are the three most common phrases in the description of restaurants?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What are the three most common phrases in the description of restaurants?", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the three most common phrases in the description of restaurants?", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 60, + "database_schema_index": 0, + "natural_language_query": "Calculate the percentage of restaurants that are open now within each grouping by their average rating.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of restaurants that are open now within each grouping by their average rating.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of restaurants that are open now within each grouping by their average rating.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 61, + "database_schema_index": 0, + "natural_language_query": "Calculate the percentage of menu items that are vegetarian based on the isVegetarian property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of menu items that are vegetarian based on the isVegetarian property.", + "target_collection": "Menus", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isVegetarian", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of menu items that are vegetarian based on the isVegetarian property.", + "target_collection": "Menu_items", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isVegetarian", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 62, + "database_schema_index": 0, + "natural_language_query": "Group restaurants by their averageRating to analyze patterns across different rating categories, helping to understand how many restaurants fall into each rating group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Group restaurants by their averageRating to analyze patterns across different rating categories, helping to understand how many restaurants fall into each rating group.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group restaurants by their averageRating to analyze patterns across different rating categories, helping to understand how many restaurants fall into each rating group.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 63, + "database_schema_index": 0, + "natural_language_query": "Identify clinics that specialize in pediatric care using semantic search, filter out only those with an averagePatientSatisfaction of 4.5 or higher, calculate the mean averagePatientSatisfaction, and group these results based on whether they are acceptingNewPatients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Identify clinics that specialize in pediatric care using semantic search, filter out only those with an averagePatientSatisfaction of 4.5 or higher, calculate the mean averagePatientSatisfaction, and group these results based on whether they are acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": "Find clinics that specialize in pediatric care", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify clinics that specialize in pediatric care using semantic search, filter out only those with an averagePatientSatisfaction of 4.5 or higher, calculate the mean averagePatientSatisfaction, and group these results based on whether they are acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": "pediatric care", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 64, + "database_schema_index": 1, + "natural_language_query": "Retrieve clinics with descriptions including 'comprehensive healthcare', having averagePatientSatisfaction greater than 4.5, and count how many of these clinics are acceptingNewPatients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Retrieve clinics with descriptions including 'comprehensive healthcare', having averagePatientSatisfaction greater than 4.5, and count how many of these clinics are acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": "Find clinics whose description includes comprehensive healthcare", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve clinics with descriptions including 'comprehensive healthcare', having averagePatientSatisfaction greater than 4.5, and count how many of these clinics are acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": "comprehensive healthcare", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 65, + "database_schema_index": 1, + "natural_language_query": "Find clinics related to cardiology with average patient satisfaction higher than 4. Resulting clinics should be grouped based on whether they are accepting new patients or not, and within each group, identify the top 5 most common service descriptions.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics related to cardiology with average patient satisfaction higher than 4. Resulting clinics should be grouped based on whether they are accepting new patients or not, and within each group, identify the top 5 most common service descriptions.", + "target_collection": "Clinics", + "search_query": "cardiology", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics related to cardiology with average patient satisfaction higher than 4. Resulting clinics should be grouped based on whether they are accepting new patients or not, and within each group, identify the top 5 most common service descriptions.", + "target_collection": "Clinics", + "search_query": "cardiology", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "serviceDescription", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 66, + "database_schema_index": 1, + "natural_language_query": "Find doctors with expertise related to dermatology and skin care, who have at least 10 years of experience, and retrieve the top 3 most common doctor names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors with expertise related to dermatology and skin care, who have at least 10 years of experience, and retrieve the top 3 most common doctor names.", + "target_collection": "Doctors", + "search_query": "Find doctors with expertise related to dermatology and skin care", + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "doctorName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors with expertise related to dermatology and skin care, who have at least 10 years of experience, and retrieve the top 3 most common doctor names.", + "target_collection": "Doctors", + "search_query": "expertise related to dermatology and skin care", + "limit": 5, + "integer_property_filter": { + "property_name": "years_of_experience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9, + "error": null + }, + { + "query_index": 67, + "database_schema_index": 1, + "natural_language_query": "Find clinics specialized in cardiovascular healthcare by searching \"description\"; filter these to only show clinics with an \"averagePatientSatisfaction\" greater than 4.5; determine the percentage of these clinics \"acceptingNewPatients\"; and finally, organize the results by \"clinicName\".", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics specialized in cardiovascular healthcare by searching \"description\"; filter these to only show clinics with an \"averagePatientSatisfaction\" greater than 4.5; determine the percentage of these clinics \"acceptingNewPatients\"; and finally, organize the results by \"clinicName\".", + "target_collection": "Clinics", + "search_query": "Find clinics that are specialized in cardiovascular healthcare.", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics specialized in cardiovascular healthcare by searching \"description\"; filter these to only show clinics with an \"averagePatientSatisfaction\" greater than 4.5; determine the percentage of these clinics \"acceptingNewPatients\"; and finally, organize the results by \"clinicName\".", + "target_collection": "Clinics", + "search_query": "cardiovascular healthcare", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 68, + "database_schema_index": 1, + "natural_language_query": "Find clinics offering pediatric services with an average patient satisfaction score greater than 4, and count the total number of clinics that are currently accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics offering pediatric services with an average patient satisfaction score greater than 4, and count the total number of clinics that are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find clinics offering pediatric services", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics offering pediatric services with an average patient satisfaction score greater than 4, and count the total number of clinics that are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "pediatric services", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfactionScore", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.925, + "error": null + }, + { + "query_index": 69, + "database_schema_index": 1, + "natural_language_query": "Find doctors who specialize in neurology with more than 10 years of experience, and group the results by whether they are currently practicing or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors who specialize in neurology with more than 10 years of experience, and group the results by whether they are currently practicing or not.", + "target_collection": "Doctors", + "search_query": "Find doctors who specialize in neurology", + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors who specialize in neurology with more than 10 years of experience, and group the results by whether they are currently practicing or not.", + "target_collection": "Doctors", + "search_query": "specialize in neurology", + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 70, + "database_schema_index": 1, + "natural_language_query": "Find clinics with a description similar to 'pediatric care' that have an averagePatientSatisfaction score of at least 4.5.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics with a description similar to 'pediatric care' that have an averagePatientSatisfaction score of at least 4.5.", + "target_collection": "Clinics", + "search_query": "pediatric care", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics with a description similar to 'pediatric care' that have an averagePatientSatisfaction score of at least 4.5.", + "target_collection": "Clinics", + "search_query": "pediatric care", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 71, + "database_schema_index": 1, + "natural_language_query": "Identify clinics that offer dental services by performing a search for relevant specialties, filter specifically for a clinic named Sunny Clinic, determine the maximum average patient satisfaction score, and group the results based on whether they are accepting new patients or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Identify clinics that offer dental services by performing a search for relevant specialties, filter specifically for a clinic named Sunny Clinic, determine the maximum average patient satisfaction score, and group the results based on whether they are accepting new patients or not.", + "target_collection": "Clinics", + "search_query": "Find clinics that offer dental services and check their specialties", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "Sunny Clinic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify clinics that offer dental services by performing a search for relevant specialties, filter specifically for a clinic named Sunny Clinic, determine the maximum average patient satisfaction score, and group the results based on whether they are accepting new patients or not.", + "target_collection": "Clinics", + "search_query": "dental services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Sunny Clinic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfactionScore", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9, + "error": null + }, + { + "query_index": 72, + "database_schema_index": 1, + "natural_language_query": "Find clinics with a description similar to 'clinic with specialties in cardiology and pediatric care', where the clinicName is exactly 'City Health Center', and calculate the average of averagePatientSatisfaction for these clinics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics with a description similar to 'clinic with specialties in cardiology and pediatric care', where the clinicName is exactly 'City Health Center', and calculate the average of averagePatientSatisfaction for these clinics.", + "target_collection": "Clinics", + "search_query": "clinic with specialties in cardiology and pediatric care", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "City Health Center" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics with a description similar to 'clinic with specialties in cardiology and pediatric care', where the clinicName is exactly 'City Health Center', and calculate the average of averagePatientSatisfaction for these clinics.", + "target_collection": "Clinics", + "search_query": "clinic with specialties in cardiology and pediatric care", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "City Health Center" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 73, + "database_schema_index": 1, + "natural_language_query": "Find clinics that offer family healthcare services using semantic search, and are accepting new patients. Count the number of unique clinics and group them by average patient satisfaction score.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that offer family healthcare services using semantic search, and are accepting new patients. Count the number of unique clinics and group them by average patient satisfaction score.", + "target_collection": "Clinics", + "search_query": "Family healthcare services", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that offer family healthcare services using semantic search, and are accepting new patients. Count the number of unique clinics and group them by average patient satisfaction score.", + "target_collection": "Clinics", + "search_query": "family healthcare services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfactionScore", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 74, + "database_schema_index": 1, + "natural_language_query": "Find clinics that describe themselves as offering holistic healthcare services, filter those with 'Health' in their clinicName, and identify the top 3 most frequently occurring clinic names from those results.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that describe themselves as offering holistic healthcare services, filter those with 'Health' in their clinicName, and identify the top 3 most frequently occurring clinic names from those results.", + "target_collection": "Clinics", + "search_query": "Find clinics that offer holistic healthcare services based on detailed description", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "LIKE", + "value": "%Health%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that describe themselves as offering holistic healthcare services, filter those with 'Health' in their clinicName, and identify the top 3 most frequently occurring clinic names from those results.", + "target_collection": "Clinics", + "search_query": "holistic healthcare services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "LIKE", + "value": "%Health%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 75, + "database_schema_index": 1, + "natural_language_query": "Find the best clinics known for pediatric services, where clinic names start with 'A', group them by average patient satisfaction, and count how many are accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find the best clinics known for pediatric services, where clinic names start with 'A', group them by average patient satisfaction, and count how many are accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find the best clinics known for pediatric services", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "LIKE", + "value": "A%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the best clinics known for pediatric services, where clinic names start with 'A', group them by average patient satisfaction, and count how many are accepting new patients.", + "target_collection": "Clinics", + "search_query": "pediatric services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "A%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "averagePatientSatisfaction", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 76, + "database_schema_index": 1, + "natural_language_query": "Find appointments related to annual health check-ups by searching in appointmentNotes for 'check-up', and count how many of these appointments are confirmed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find appointments related to annual health check-ups by searching in appointmentNotes for 'check-up', and count how many of these appointments are confirmed.", + "target_collection": "Appointments", + "search_query": "Find the appointments that are relevant to annual health check-ups", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "appointmentNotes", + "operator": "LIKE", + "value": "check-up" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find appointments related to annual health check-ups by searching in appointmentNotes for 'check-up', and count how many of these appointments are confirmed.", + "target_collection": "Appointments", + "search_query": "check-up", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "confirmed", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 77, + "database_schema_index": 1, + "natural_language_query": "Search for clinics that have descriptions mentioning advanced medical technology, filter by the clinic name \"Healthcare Plus Clinic\", and group the results by whether they are accepting new patients, aggregating average patient satisfaction scores within each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Search for clinics that have descriptions mentioning advanced medical technology, filter by the clinic name \"Healthcare Plus Clinic\", and group the results by whether they are accepting new patients, aggregating average patient satisfaction scores within each group.", + "target_collection": "Clinics", + "search_query": "Find clinics whose description includes advanced medical technology.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "Healthcare Plus Clinic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for clinics that have descriptions mentioning advanced medical technology, filter by the clinic name \"Healthcare Plus Clinic\", and group the results by whether they are accepting new patients, aggregating average patient satisfaction scores within each group.", + "target_collection": "Clinics", + "search_query": "advanced medical technology", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Healthcare Plus Clinic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "patientSatisfactionScore", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 78, + "database_schema_index": 1, + "natural_language_query": "Search for clinics whose description indicates a focus on comprehensive dermatology services and skin care treatments, and filter to include only those clinics with 'Dermatology' in their clinicName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Search for clinics whose description indicates a focus on comprehensive dermatology services and skin care treatments, and filter to include only those clinics with 'Dermatology' in their clinicName.", + "target_collection": "Clinics", + "search_query": "Find clinics that provide comprehensive dermatology services and skin care treatments", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "LIKE", + "value": "*Dermatology*" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for clinics whose description indicates a focus on comprehensive dermatology services and skin care treatments, and filter to include only those clinics with 'Dermatology' in their clinicName.", + "target_collection": "Clinics", + "search_query": "comprehensive dermatology services and skin care treatments", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "LIKE", + "value": "%Dermatology%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 79, + "database_schema_index": 1, + "natural_language_query": "Find clinics based on a high patient satisfaction, filter to include only those currently accepting new patients, perform an average calculation of the averagePatientSatisfaction, and group the results by clinic name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics based on a high patient satisfaction, filter to include only those currently accepting new patients, perform an average calculation of the averagePatientSatisfaction, and group the results by clinic name.", + "target_collection": "Clinics", + "search_query": "high patient satisfaction", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics based on a high patient satisfaction, filter to include only those currently accepting new patients, perform an average calculation of the averagePatientSatisfaction, and group the results by clinic name.", + "target_collection": "Clinics", + "search_query": "high patient satisfaction", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 80, + "database_schema_index": 1, + "natural_language_query": "Find clinics that are conceptually related to pediatrics, are accepting new patients, and calculate the mean average patient satisfaction score across all such clinics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that are conceptually related to pediatrics, are accepting new patients, and calculate the mean average patient satisfaction score across all such clinics.", + "target_collection": "Clinics", + "search_query": "pediatrics", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that are conceptually related to pediatrics, are accepting new patients, and calculate the mean average patient satisfaction score across all such clinics.", + "target_collection": "Clinics", + "search_query": "pediatrics", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfactionScore", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 81, + "database_schema_index": 1, + "natural_language_query": "Find doctors with expertise in cardiology who are currently practicing, show how many doctors there are per expertise, and group them by their expertise category.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors with expertise in cardiology who are currently practicing, show how many doctors there are per expertise, and group them by their expertise category.", + "target_collection": "Doctors", + "search_query": "Find doctors with expertise in 'cardiology'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyPracticing", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "expertise" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors with expertise in cardiology who are currently practicing, show how many doctors there are per expertise, and group them by their expertise category.", + "target_collection": "Doctors", + "search_query": "expertise in cardiology", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyPracticing", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "expertiseCategory", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 82, + "database_schema_index": 1, + "natural_language_query": "Find clinics that match specific healthcare needs and services, filter to show only those accepting new patients, and aggregate to find the top 5 most common descriptions of these clinics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that match specific healthcare needs and services, filter to show only those accepting new patients, and aggregate to find the top 5 most common descriptions of these clinics.", + "target_collection": "Clinics", + "search_query": "Find clinics that provide specialties or services mentioned in the search", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that match specific healthcare needs and services, filter to show only those accepting new patients, and aggregate to find the top 5 most common descriptions of these clinics.", + "target_collection": "Clinics", + "search_query": "specific healthcare needs and services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 83, + "database_schema_index": 1, + "natural_language_query": "Identify clinics that provide cardiology services (using descriptions for search), determine which of them are currently accepting new patients, and count the number of clinics within each range of average patient satisfaction scores.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Identify clinics that provide cardiology services (using descriptions for search), determine which of them are currently accepting new patients, and count the number of clinics within each range of average patient satisfaction scores.", + "target_collection": "Clinics", + "search_query": "Find clinics offering cardiology services", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify clinics that provide cardiology services (using descriptions for search), determine which of them are currently accepting new patients, and count the number of clinics within each range of average patient satisfaction scores.", + "target_collection": "Clinics", + "search_query": "cardiology services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 84, + "database_schema_index": 1, + "natural_language_query": "Find clinics that match the concept of 'family healthcare services', filter those that are accepting new patients, and calculate the percentage of clinics that are accepting new patients among the total results.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that match the concept of 'family healthcare services', filter those that are accepting new patients, and calculate the percentage of clinics that are accepting new patients among the total results.", + "target_collection": "Clinics", + "search_query": "Find clinics that match the concept of 'family healthcare services'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that match the concept of 'family healthcare services', filter those that are accepting new patients, and calculate the percentage of clinics that are accepting new patients among the total results.", + "target_collection": "Clinics", + "search_query": "family healthcare services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 85, + "database_schema_index": 1, + "natural_language_query": "Find clinics that specialize in pediatric care and are accepting new patients, then group the results by their average patient satisfaction score.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that specialize in pediatric care and are accepting new patients, then group the results by their average patient satisfaction score.", + "target_collection": "Clinics", + "search_query": "Find clinics that specialize in pediatric care", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that specialize in pediatric care and are accepting new patients, then group the results by their average patient satisfaction score.", + "target_collection": "Clinics", + "search_query": "pediatric care", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfactionScore", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 86, + "database_schema_index": 1, + "natural_language_query": "Find clinics that specialize in cardiac care based on their description and are currently accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that specialize in cardiac care based on their description and are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find clinics that specialize in cardiac care based on their description", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that specialize in cardiac care based on their description and are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "cardiac care", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 87, + "database_schema_index": 1, + "natural_language_query": "List clinics that provide excellent healthcare services. Within these clinics, group them by their clinic names and count how many are currently accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "List clinics that provide excellent healthcare services. Within these clinics, group them by their clinic names and count how many are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find clinics that match the description of providing excellent healthcare services with high specialties", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "List clinics that provide excellent healthcare services. Within these clinics, group them by their clinic names and count how many are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "excellent healthcare services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 88, + "database_schema_index": 1, + "natural_language_query": "Find doctors in the Doctors collection specializing in 'cardiology' based on their expertise property, and calculate the mean yearsOfExperience for these doctors.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors in the Doctors collection specializing in 'cardiology' based on their expertise property, and calculate the mean yearsOfExperience for these doctors.", + "target_collection": "Doctors", + "search_query": "Find doctors specializing in cardiology", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors in the Doctors collection specializing in 'cardiology' based on their expertise property, and calculate the mean yearsOfExperience for these doctors.", + "target_collection": "Doctors", + "search_query": "cardiology", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 89, + "database_schema_index": 1, + "natural_language_query": "Find clinics that provide 'dental services', group them by whether they are accepting new patients, and count how many clinics are in each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that provide 'dental services', group them by whether they are accepting new patients, and count how many clinics are in each group.", + "target_collection": "Clinics", + "search_query": "Find clinics providing 'dental services'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 90, + "database_schema_index": 1, + "natural_language_query": "Find clinics offering high-quality healthcare services based on their description, and count the number of unique clinic names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics offering high-quality healthcare services based on their description, and count the number of unique clinic names.", + "target_collection": "Clinics", + "search_query": "High-quality healthcare services", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics offering high-quality healthcare services based on their description, and count the number of unique clinic names.", + "target_collection": "Clinics", + "search_query": "high-quality healthcare services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 91, + "database_schema_index": 1, + "natural_language_query": "Search for clinics where the description mentions specific healthcare services you need, determine what percentage of these clinics are accepting new patients, and group the results by clinicName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Search for clinics where the description mentions specific healthcare services you need, determine what percentage of these clinics are accepting new patients, and group the results by clinicName.", + "target_collection": "Clinics", + "search_query": "Find clinics with descriptions similar to healthcare services or specialties you need", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for clinics where the description mentions specific healthcare services you need, determine what percentage of these clinics are accepting new patients, and group the results by clinicName.", + "target_collection": "Clinics", + "search_query": "specific healthcare services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 92, + "database_schema_index": 1, + "natural_language_query": "How many clinics that offer pediatrics and family healthcare are currently accepting new patients?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "How many clinics that offer pediatrics and family healthcare are currently accepting new patients?", + "target_collection": "Clinics", + "search_query": "Find clinics that offer pediatrics and family healthcare", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "How many clinics that offer pediatrics and family healthcare are currently accepting new patients?", + "target_collection": "Clinics", + "search_query": "offer pediatrics and family healthcare", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 93, + "database_schema_index": 1, + "natural_language_query": "Find clinics that specialize in pediatric services, offer state-of-the-art facilities, and have high ratings for patient care experience, and then group these clinics based on whether they are accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that specialize in pediatric services, offer state-of-the-art facilities, and have high ratings for patient care experience, and then group these clinics based on whether they are accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find clinics that specialize in pediatric services, offer state-of-the-art facilities, and have high ratings for patient care experience", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that specialize in pediatric services, offer state-of-the-art facilities, and have high ratings for patient care experience, and then group these clinics based on whether they are accepting new patients.", + "target_collection": "Clinics", + "search_query": "pediatric services, state-of-the-art facilities, high ratings for patient care experience", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 94, + "database_schema_index": 1, + "natural_language_query": "What clinics are recognized for their exceptional orthopedic services and a high emphasis on patient care?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "What clinics are recognized for their exceptional orthopedic services and a high emphasis on patient care?", + "target_collection": "Clinics", + "search_query": "Find clinics that are renowned for exceptional orthopedic services and have a high focus on patient care.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What clinics are recognized for their exceptional orthopedic services and a high emphasis on patient care?", + "target_collection": "Clinics", + "search_query": "exceptional orthopedic services and a high emphasis on patient care", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 95, + "database_schema_index": 1, + "natural_language_query": "Find doctors with more than 10 yearsOfExperience, calculate the average yearsOfExperience for these doctors, and group the results by whether they are currentlyPracticing or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors with more than 10 yearsOfExperience, calculate the average yearsOfExperience for these doctors, and group the results by whether they are currentlyPracticing or not.", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors with more than 10 yearsOfExperience, calculate the average yearsOfExperience for these doctors, and group the results by whether they are currentlyPracticing or not.", + "target_collection": "Doctors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 96, + "database_schema_index": 1, + "natural_language_query": "Find the number of clinics where the averagePatientSatisfaction score is at least 4.5", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find the number of clinics where the averagePatientSatisfaction score is at least 4.5", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the number of clinics where the averagePatientSatisfaction score is at least 4.5", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 97, + "database_schema_index": 1, + "natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5, then group results by acceptingNewPatients status and determine the top 3 most common specialties within each group's description.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5, then group results by acceptingNewPatients status and determine the top 3 most common specialties within each group's description.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5, then group results by acceptingNewPatients status and determine the top 3 most common specialties within each group's description.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description.specialties", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 98, + "database_schema_index": 1, + "natural_language_query": "Find appointments that have an appointmentDuration of at least 30 minutes and determine the most common patientName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find appointments that have an appointmentDuration of at least 30 minutes and determine the most common patientName.", + "target_collection": "Appointments", + "search_query": null, + "integer_property_filter": { + "property_name": "appointmentDuration", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "patientName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find appointments that have an appointmentDuration of at least 30 minutes and determine the most common patientName.", + "target_collection": "Appointments", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "appointmentDuration", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "patientName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 99, + "database_schema_index": 1, + "natural_language_query": "Group clinics by their clinicName, but only include those with an averagePatientSatisfaction of at least 4.5, and count how many of these clinics are currently accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Group clinics by their clinicName, but only include those with an averagePatientSatisfaction of at least 4.5, and count how many of these clinics are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group clinics by their clinicName, but only include those with an averagePatientSatisfaction of at least 4.5, and count how many of these clinics are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 100, + "database_schema_index": 1, + "natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5 and count how many of these clinics are currently acceptingNewPatients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5 and count how many of these clinics are currently acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5 and count how many of these clinics are currently acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 101, + "database_schema_index": 1, + "natural_language_query": "Find doctors with at least 10 years of experience and group results by whether they are currently practicing.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors with at least 10 years of experience and group results by whether they are currently practicing.", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors with at least 10 years of experience and group results by whether they are currently practicing.", + "target_collection": "Doctors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "years_of_experience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currently_practicing", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 102, + "database_schema_index": 1, + "natural_language_query": "Find doctors who have more than 10 years in yearsOfExperience", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors who have more than 10 years in yearsOfExperience", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors who have more than 10 years in yearsOfExperience", + "target_collection": "Doctors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 103, + "database_schema_index": 1, + "natural_language_query": "Find all clinics where the description contains the keyword 'specialty', group them by their acceptingNewPatients status, and calculate the maximum averagePatientSatisfaction score for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find all clinics where the description contains the keyword 'specialty', group them by their acceptingNewPatients status, and calculate the maximum averagePatientSatisfaction score for each group.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "specialty" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all clinics where the description contains the keyword 'specialty', group them by their acceptingNewPatients status, and calculate the maximum averagePatientSatisfaction score for each group.", + "target_collection": "Clinics", + "search_query": "specialty", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 104, + "database_schema_index": 1, + "natural_language_query": "How many appointments have the word 'consultation' in their appointmentNotes and what is their total count for appointmentDuration?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "How many appointments have the word 'consultation' in their appointmentNotes and what is their total count for appointmentDuration?", + "target_collection": "Appointments", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "appointmentNotes", + "operator": "LIKE", + "value": "consultation" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "How many appointments have the word 'consultation' in their appointmentNotes and what is their total count for appointmentDuration?", + "target_collection": "Appointments", + "search_query": "consultation", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "appointmentDuration", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 105, + "database_schema_index": 1, + "natural_language_query": "Identify how many different averagePatientSatisfaction scores exist for clinics whose description includes the term 'multispecialty', grouped by the description property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Identify how many different averagePatientSatisfaction scores exist for clinics whose description includes the term 'multispecialty', grouped by the description property.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "multispecialty" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify how many different averagePatientSatisfaction scores exist for clinics whose description includes the term 'multispecialty', grouped by the description property.", + "target_collection": "Clinics", + "search_query": "multispecialty", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MODE" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 106, + "database_schema_index": 1, + "natural_language_query": "Find the number of unique clinicName values from the Clinics collection where the description contains the word 'dental' by counting these occurrences.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find the number of unique clinicName values from the Clinics collection where the description contains the word 'dental' by counting these occurrences.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%dental%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the number of unique clinicName values from the Clinics collection where the description contains the word 'dental' by counting these occurrences.", + "target_collection": "Clinics", + "search_query": "dental", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 107, + "database_schema_index": 1, + "natural_language_query": "Show the percentage of clinics accepting new patients, grouped by clinicName, where the clinic's description contains the word pediatrics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Show the percentage of clinics accepting new patients, grouped by clinicName, where the clinic's description contains the word pediatrics.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "pediatrics" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show the percentage of clinics accepting new patients, grouped by clinicName, where the clinic's description contains the word pediatrics.", + "target_collection": "Clinics", + "search_query": "pediatrics", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 108, + "database_schema_index": 1, + "natural_language_query": "Find clinics where the description includes 'cancer', and determine how many of these clinics are accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics where the description includes 'cancer', and determine how many of these clinics are accepting new patients.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%cancer%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics where the description includes 'cancer', and determine how many of these clinics are accepting new patients.", + "target_collection": "Clinics", + "search_query": "cancer", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 109, + "database_schema_index": 1, + "natural_language_query": "Find clinics that have 'pediatrics' in their description, and group them by whether they are accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that have 'pediatrics' in their description, and group them by whether they are accepting new patients.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "pediatrics" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that have 'pediatrics' in their description, and group them by whether they are accepting new patients.", + "target_collection": "Clinics", + "search_query": "pediatrics", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 110, + "database_schema_index": 1, + "natural_language_query": "Retrieve the clinic that has the exact clinicName 'Community HealthCare Center'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Retrieve the clinic that has the exact clinicName 'Community HealthCare Center'.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "Community HealthCare Center" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve the clinic that has the exact clinicName 'Community HealthCare Center'.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "Community HealthCare Center" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 111, + "database_schema_index": 1, + "natural_language_query": "For clinics that are accepting new patients, calculate the mean averagePatientSatisfaction score for each category described by 'description'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "For clinics that are accepting new patients, calculate the mean averagePatientSatisfaction score for each category described by 'description'.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description" + }, + "predicted_query": { + "corresponding_natural_language_query": "For clinics that are accepting new patients, calculate the mean averagePatientSatisfaction score for each category described by 'description'.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "accepting_new_patients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 112, + "database_schema_index": 1, + "natural_language_query": "Find clinics that are accepting new patients and calculate the mean of averagePatientSatisfaction scores for those clinics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that are accepting new patients and calculate the mean of averagePatientSatisfaction scores for those clinics.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that are accepting new patients and calculate the mean of averagePatientSatisfaction scores for those clinics.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 113, + "database_schema_index": 1, + "natural_language_query": "Find clinics that are accepting new patients (using 'acceptingNewPatients' with true value), group the results by clinicName, and aggregate to count the occurrences of each clinic name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that are accepting new patients (using 'acceptingNewPatients' with true value), group the results by clinicName, and aggregate to count the occurrences of each clinic name.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that are accepting new patients (using 'acceptingNewPatients' with true value), group the results by clinicName, and aggregate to count the occurrences of each clinic name.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 114, + "database_schema_index": 1, + "natural_language_query": "Find all clinics where acceptingNewPatients is true, and count how many different clinics share the same description.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find all clinics where acceptingNewPatients is true, and count how many different clinics share the same description.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all clinics where acceptingNewPatients is true, and count how many different clinics share the same description.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "description", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 115, + "database_schema_index": 1, + "natural_language_query": "Find and display the percentage of clinics that are currently accepting new patients, grouped by each clinic's name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find and display the percentage of clinics that are currently accepting new patients, grouped by each clinic's name.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find and display the percentage of clinics that are currently accepting new patients, grouped by each clinic's name.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 116, + "database_schema_index": 1, + "natural_language_query": "Find all appointments where appointmentConfirmed is false and also count the total number of appointments based on appointmentConfirmed status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find all appointments where appointmentConfirmed is false and also count the total number of appointments based on appointmentConfirmed status.", + "target_collection": "Appointments", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "appointmentConfirmed", + "operator": "=", + "value": false + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all appointments where appointmentConfirmed is false and also count the total number of appointments based on appointmentConfirmed status.", + "target_collection": "Appointments", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "appointmentConfirmed", + "operator": "=", + "value": false + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "appointmentConfirmed", + "metrics": "TOTAL_FALSE" + }, + "groupby_property": "appointmentConfirmed", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 117, + "database_schema_index": 1, + "natural_language_query": "Find all clinics that are accepting new patients and group them by clinicName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find all clinics that are accepting new patients and group them by clinicName.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all clinics that are accepting new patients and group them by clinicName.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 118, + "database_schema_index": 1, + "natural_language_query": "Find clinics where acceptingNewPatients is equal to true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics where acceptingNewPatients is equal to true.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics where acceptingNewPatients is equal to true.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 119, + "database_schema_index": 1, + "natural_language_query": "Determine the mean years of experience for doctors, categorized by their expertise.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Determine the mean years of experience for doctors, categorized by their expertise.", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "expertise" + }, + "predicted_query": { + "corresponding_natural_language_query": "Determine the mean years of experience for doctors, categorized by their expertise.", + "target_collection": "Doctors", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "expertise", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 120, + "database_schema_index": 1, + "natural_language_query": "Using the int_property_aggregation operator, calculate the total number of years of experience across all doctors by summing the 'yearsOfExperience' property in the Doctors collection.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Using the int_property_aggregation operator, calculate the total number of years of experience across all doctors by summing the 'yearsOfExperience' property in the Doctors collection.", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Using the int_property_aggregation operator, calculate the total number of years of experience across all doctors by summing the 'yearsOfExperience' property in the Doctors collection.", + "target_collection": "Doctors", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 121, + "database_schema_index": 1, + "natural_language_query": "What are the top 5 most common areas of expertise for doctors, grouped by whether they are currently practicing?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "What are the top 5 most common areas of expertise for doctors, grouped by whether they are currently practicing?", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "expertise", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the top 5 most common areas of expertise for doctors, grouped by whether they are currently practicing?", + "target_collection": "Doctors", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "areasOfExpertise", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 122, + "database_schema_index": 1, + "natural_language_query": "What are the top 5 most common clinicName entries in the Clinics collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "What are the top 5 most common clinicName entries in the Clinics collection?", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the top 5 most common clinicName entries in the Clinics collection?", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 123, + "database_schema_index": 1, + "natural_language_query": "Calculate the percentage of clinics that are accepting new patients, grouped by their average patient satisfaction.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of clinics that are accepting new patients, grouped by their average patient satisfaction.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of clinics that are accepting new patients, grouped by their average patient satisfaction.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averagePatientSatisfaction", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 124, + "database_schema_index": 1, + "natural_language_query": "How many clinics are currently accepting new patients compared to those that are not?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "How many clinics are currently accepting new patients compared to those that are not?", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "How many clinics are currently accepting new patients compared to those that are not?", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 125, + "database_schema_index": 1, + "natural_language_query": "Group clinics by their averagePatientSatisfaction scores to see the distribution of clinics based on patient satisfaction levels, organizing the results into different satisfaction categories.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Group clinics by their averagePatientSatisfaction scores to see the distribution of clinics based on patient satisfaction levels, organizing the results into different satisfaction categories.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group clinics by their averagePatientSatisfaction scores to see the distribution of clinics based on patient satisfaction levels, organizing the results into different satisfaction categories.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 126, + "database_schema_index": 1, + "natural_language_query": "Show me students interested in 'learning algorithms' who have completed more than 20 completedCredits, aggregate the count of completedCredits for these students, and group the results by their enrolledFullTime status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Show me students interested in 'learning algorithms' who have completed more than 20 completedCredits, aggregate the count of completedCredits for these students, and group the results by their enrolledFullTime status.", + "target_collection": "Students", + "search_query": "learning algorithms", + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show me students interested in 'learning algorithms' who have completed more than 20 completedCredits, aggregate the count of completedCredits for these students, and group the results by their enrolledFullTime status.", + "target_collection": "Students", + "search_query": "learning algorithms", + "limit": 5, + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "completedCredits", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 127, + "database_schema_index": 1, + "natural_language_query": "Find students whose researchInterests include machine learning, filter those who have completedCredits of at least 30, and calculate the average completedCredits of these students.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find students whose researchInterests include machine learning, filter those who have completedCredits of at least 30, and calculate the average completedCredits of these students.", + "target_collection": "Students", + "search_query": "Find students whose researchInterests include machine learning", + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "completedCredits", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find students whose researchInterests include machine learning, filter those who have completedCredits of at least 30, and calculate the average completedCredits of these students.", + "target_collection": "Students", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "completedCredits", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 128, + "database_schema_index": 2, + "natural_language_query": "Identify courses related to machine learning that have a courseDuration of at least 5 hours, and determine the most frequently occurring courseTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify courses related to machine learning that have a courseDuration of at least 5 hours, and determine the most frequently occurring courseTitle.", + "target_collection": "Courses", + "search_query": "machine learning", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify courses related to machine learning that have a courseDuration of at least 5 hours, and determine the most frequently occurring courseTitle.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 129, + "database_schema_index": 2, + "natural_language_query": "Find courses that semantically relate to data science and machine learning in their courseDescription, filter for those which courseDuration is at least 40 hours, and show the top 5 most common courseTitle values for these courses.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that semantically relate to data science and machine learning in their courseDescription, filter for those which courseDuration is at least 40 hours, and show the top 5 most common courseTitle values for these courses.", + "target_collection": "Courses", + "search_query": "data science and machine learning", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 40 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that semantically relate to data science and machine learning in their courseDescription, filter for those which courseDuration is at least 40 hours, and show the top 5 most common courseTitle values for these courses.", + "target_collection": "Courses", + "search_query": "data science and machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 40 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 130, + "database_schema_index": 2, + "natural_language_query": "List all courses related to artificial intelligence and machine learning that require at least 20 hours to complete, show the percentage of those courses currently accepting enrollments, and categorize the results by whether they are currently enrolling or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "List all courses related to artificial intelligence and machine learning that require at least 20 hours to complete, show the percentage of those courses currently accepting enrollments, and categorize the results by whether they are currently enrolling or not.", + "target_collection": "Courses", + "search_query": "Find courses related to artificial intelligence and machine learning.", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "List all courses related to artificial intelligence and machine learning that require at least 20 hours to complete, show the percentage of those courses currently accepting enrollments, and categorize the results by whether they are currently enrolling or not.", + "target_collection": "Courses", + "search_query": "artificial intelligence and machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "hours", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 131, + "database_schema_index": 2, + "natural_language_query": "Find courses that are similar to 'data science', have a courseDuration of 40 hours or less, and calculate the percentage of these courses that are currentlyEnrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are similar to 'data science', have a courseDuration of 40 hours or less, and calculate the percentage of these courses that are currentlyEnrolling.", + "target_collection": "Courses", + "search_query": "Find courses similar to data science that enhance learning outcomes", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": "<=", + "value": 40 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are similar to 'data science', have a courseDuration of 40 hours or less, and calculate the percentage of these courses that are currentlyEnrolling.", + "target_collection": "Courses", + "search_query": "data science", + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": "<=", + "value": 40 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 132, + "database_schema_index": 2, + "natural_language_query": "Find students interested in machine learning who have completed at least 30 credits, grouped by whether they are enrolled full-time.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find students interested in machine learning who have completed at least 30 credits, grouped by whether they are enrolled full-time.", + "target_collection": "Students", + "search_query": "students interested in machine learning", + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find students interested in machine learning who have completed at least 30 credits, grouped by whether they are enrolled full-time.", + "target_collection": "Students", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "credits", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 133, + "database_schema_index": 2, + "natural_language_query": "Find courses that relate to artificial intelligence which have a courseDuration of at least 20 hours.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that relate to artificial intelligence which have a courseDuration of at least 20 hours.", + "target_collection": "Courses", + "search_query": "Find courses related to artificial intelligence", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that relate to artificial intelligence which have a courseDuration of at least 20 hours.", + "target_collection": "Courses", + "search_query": "artificial intelligence", + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 134, + "database_schema_index": 2, + "natural_language_query": "What is the average duration of courses related to artificial intelligence that are currently enrolling, and organize the results by course title?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average duration of courses related to artificial intelligence that are currently enrolling, and organize the results by course title?", + "target_collection": "Courses", + "search_query": "artificial intelligence", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average duration of courses related to artificial intelligence that are currently enrolling, and organize the results by course title?", + "target_collection": "Courses", + "search_query": "artificial intelligence", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "enrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "duration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 135, + "database_schema_index": 2, + "natural_language_query": "Search for courses whose descriptions are conceptually similar to 'machine learning and artificial intelligence', filter to find courses with the exact courseTitle 'Introduction to AI', and calculate the average courseDuration of these courses.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Search for courses whose descriptions are conceptually similar to 'machine learning and artificial intelligence', filter to find courses with the exact courseTitle 'Introduction to AI', and calculate the average courseDuration of these courses.", + "target_collection": "Courses", + "search_query": "Find me the courses that cover topics similar to 'machine learning and artificial intelligence'.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "=", + "value": "Introduction to AI" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for courses whose descriptions are conceptually similar to 'machine learning and artificial intelligence', filter to find courses with the exact courseTitle 'Introduction to AI', and calculate the average courseDuration of these courses.", + "target_collection": "Courses", + "search_query": "machine learning and artificial intelligence", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "=", + "value": "Introduction to AI" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 136, + "database_schema_index": 2, + "natural_language_query": "Find courses related to data science and machine learning by courseDescription, filter these courses to only those that are currently open for enrollment, count the unique course titles, and then group the courses by their duration to analyze the number of courses segmented by different durations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses related to data science and machine learning by courseDescription, filter these courses to only those that are currently open for enrollment, count the unique course titles, and then group the courses by their duration to analyze the number of courses segmented by different durations.", + "target_collection": "Courses", + "search_query": "Find courses related to data science and machine learning by courseDescription", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses related to data science and machine learning by courseDescription, filter these courses to only those that are currently open for enrollment, count the unique course titles, and then group the courses by their duration to analyze the number of courses segmented by different durations.", + "target_collection": "Courses", + "search_query": "data science and machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isOpenForEnrollment", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 137, + "database_schema_index": 2, + "natural_language_query": "Find courses that focus on machine learning that are currently enrolling, and display the top 5 most common course titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that focus on machine learning that are currently enrolling, and display the top 5 most common course titles.", + "target_collection": "Courses", + "search_query": "Find courses that focus on machine learning", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that focus on machine learning that are currently enrolling, and display the top 5 most common course titles.", + "target_collection": "Courses", + "search_query": "courses that focus on machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 138, + "database_schema_index": 2, + "natural_language_query": "Search for courses that focus on 'machine learning' topics, filter to include only those that have 'Data Science' in their course title, calculate the percentage of these courses that are currently enrolling, and group the results by course duration.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Search for courses that focus on 'machine learning' topics, filter to include only those that have 'Data Science' in their course title, calculate the percentage of these courses that are currently enrolling, and group the results by course duration.", + "target_collection": "Courses", + "search_query": "machine learning", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Data Science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for courses that focus on 'machine learning' topics, filter to include only those that have 'Data Science' in their course title, calculate the percentage of these courses that are currently enrolling, and group the results by course duration.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "title", + "operator": "LIKE", + "value": "%Data Science%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "duration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 139, + "database_schema_index": 2, + "natural_language_query": "Find instructors who are described as experienced in teaching computer science in their biography, specifically look for instructors named Jane Doe, and calculate the percentage of instructors who hold a tenured position in the 'tenured' field.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find instructors who are described as experienced in teaching computer science in their biography, specifically look for instructors named Jane Doe, and calculate the percentage of instructors who hold a tenured position in the 'tenured' field.", + "target_collection": "Instructors", + "search_query": "experienced in teaching computer science", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "instructorName", + "operator": "=", + "value": "Jane Doe" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "tenured", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find instructors who are described as experienced in teaching computer science in their biography, specifically look for instructors named Jane Doe, and calculate the percentage of instructors who hold a tenured position in the 'tenured' field.", + "target_collection": "Instructors", + "search_query": "experienced in teaching computer science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Jane Doe" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "tenured", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 140, + "database_schema_index": 2, + "natural_language_query": "Find courses related to Python programming where the course title contains 'Introduction', and group the results by whether the courses are currently enrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses related to Python programming where the course title contains 'Introduction', and group the results by whether the courses are currently enrolling.", + "target_collection": "Courses", + "search_query": "Python programming", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "%Introduction%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses related to Python programming where the course title contains 'Introduction', and group the results by whether the courses are currently enrolling.", + "target_collection": "Courses", + "search_query": "Python programming", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "title", + "operator": "LIKE", + "value": "Introduction" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 141, + "database_schema_index": 2, + "natural_language_query": "Show me courses that cover 'machine learning fundamentals' in their descriptions and have the word 'Advanced' in the course title.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Show me courses that cover 'machine learning fundamentals' in their descriptions and have the word 'Advanced' in the course title.", + "target_collection": "Courses", + "search_query": "Find courses that cover 'machine learning fundamentals' in courseDescription", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Advanced" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Show me courses that cover 'machine learning fundamentals' in their descriptions and have the word 'Advanced' in the course title.", + "target_collection": "Courses", + "search_query": "machine learning fundamentals Advanced", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 142, + "database_schema_index": 2, + "natural_language_query": "Search for courses related to machine learning and deep learning that are currently open for enrollment, calculate the average duration of these courses, and categorize the results based on the enrollment status of the courses.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Search for courses related to machine learning and deep learning that are currently open for enrollment, calculate the average duration of these courses, and categorize the results based on the enrollment status of the courses.", + "target_collection": "Courses", + "search_query": "Find courses related to machine learning and deep learning exploration", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for courses related to machine learning and deep learning that are currently open for enrollment, calculate the average duration of these courses, and categorize the results based on the enrollment status of the courses.", + "target_collection": "Courses", + "search_query": "machine learning and deep learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isOpenForEnrollment", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "duration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "enrollmentStatus", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.75, + "error": null + }, + { + "query_index": 143, + "database_schema_index": 2, + "natural_language_query": "What are the courses related to 'machine learning' that are currently enrolling, and what is the average course duration?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What are the courses related to 'machine learning' that are currently enrolling, and what is the average course duration?", + "target_collection": "Courses", + "search_query": "Find courses related to 'machine learning' based on courseDescription", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the courses related to 'machine learning' that are currently enrolling, and what is the average course duration?", + "target_collection": "Courses", + "search_query": "machine learning courses", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "duration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.75, + "error": null + }, + { + "query_index": 144, + "database_schema_index": 2, + "natural_language_query": "Find courses related to \"machine learning\" in courseDescription that are currently enrolling, count the number of unique courses titles, and group the results by courseDuration.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses related to \"machine learning\" in courseDescription that are currently enrolling, count the number of unique courses titles, and group the results by courseDuration.", + "target_collection": "Courses", + "search_query": "Find courses related to \"machine learning\" in courseDescription", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses related to \"machine learning\" in courseDescription that are currently enrolling, count the number of unique courses titles, and group the results by courseDuration.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 145, + "database_schema_index": 2, + "natural_language_query": "Find courses that are related to data science in courseDescription, are currently enrolling as indicated by currentlyEnrolling being true, and return the top 5 most popular course titles using courseTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are related to data science in courseDescription, are currently enrolling as indicated by currentlyEnrolling being true, and return the top 5 most popular course titles using courseTitle.", + "target_collection": "Courses", + "search_query": "Data Science", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are related to data science in courseDescription, are currently enrolling as indicated by currentlyEnrolling being true, and return the top 5 most popular course titles using courseTitle.", + "target_collection": "Courses", + "search_query": "data science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 146, + "database_schema_index": 2, + "natural_language_query": "What are the currently enrolling courses related to 'machine learning applied techniques', and how is the enrollment status distributed across these courses by course title?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What are the currently enrolling courses related to 'machine learning applied techniques', and how is the enrollment status distributed across these courses by course title?", + "target_collection": "Courses", + "search_query": "Find courses related to 'machine learning applied techniques' in courseDescription", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the currently enrolling courses related to 'machine learning applied techniques', and how is the enrollment status distributed across these courses by course title?", + "target_collection": "Courses", + "search_query": "machine learning applied techniques", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "enrollingNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "title", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 147, + "database_schema_index": 2, + "natural_language_query": "Find courses by topics related to artificial intelligence, filter to only include those that are currently open for enrollment, and calculate the percentage of total courses that are currently enrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses by topics related to artificial intelligence, filter to only include those that are currently open for enrollment, and calculate the percentage of total courses that are currently enrolling.", + "target_collection": "Courses", + "search_query": "Find courses by topics related to artificial intelligence", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses by topics related to artificial intelligence, filter to only include those that are currently open for enrollment, and calculate the percentage of total courses that are currently enrolling.", + "target_collection": "Courses", + "search_query": "artificial intelligence", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 148, + "database_schema_index": 2, + "natural_language_query": "Find courses related to data science that are currently enrolling, and group these courses by their courseDuration to see how they vary by length.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses related to data science that are currently enrolling, and group these courses by their courseDuration to see how they vary by length.", + "target_collection": "Courses", + "search_query": "Find courses with subjects related to 'data science'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses related to data science that are currently enrolling, and group these courses by their courseDuration to see how they vary by length.", + "target_collection": "Courses", + "search_query": "data science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 149, + "database_schema_index": 2, + "natural_language_query": "Find courses with topics related to 'machine learning techniques' that are currently enrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses with topics related to 'machine learning techniques' that are currently enrolling.", + "target_collection": "Courses", + "search_query": "Find courses with topics related to 'machine learning techniques'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses with topics related to 'machine learning techniques' that are currently enrolling.", + "target_collection": "Courses", + "search_query": "machine learning techniques", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 150, + "database_schema_index": 2, + "natural_language_query": "What is the average course duration of courses related to 'machine learning fundamentals', and how does it vary between courses that are currently enrolling and those that are not?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average course duration of courses related to 'machine learning fundamentals', and how does it vary between courses that are currently enrolling and those that are not?", + "target_collection": "Courses", + "search_query": "Find courses that match the phrase 'machine learning fundamentals'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average course duration of courses related to 'machine learning fundamentals', and how does it vary between courses that are currently enrolling and those that are not?", + "target_collection": "Courses", + "search_query": "machine learning fundamentals", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "duration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 151, + "database_schema_index": 2, + "natural_language_query": "Find courses that are conceptually similar to 'data science' and calculate the average course duration in courseDuration.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are conceptually similar to 'data science' and calculate the average course duration in courseDuration.", + "target_collection": "Courses", + "search_query": "Find courses that best match the concept of 'data science'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are conceptually similar to 'data science' and calculate the average course duration in courseDuration.", + "target_collection": "Courses", + "search_query": "conceptually similar to 'data science'", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 152, + "database_schema_index": 2, + "natural_language_query": "Find students who have research interests similar to quantum computing and determine the count of unique research interests, while grouping the results by whether they are enrolled full-time.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find students who have research interests similar to quantum computing and determine the count of unique research interests, while grouping the results by whether they are enrolled full-time.", + "target_collection": "Students", + "search_query": "quantum computing", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find students who have research interests similar to quantum computing and determine the count of unique research interests, while grouping the results by whether they are enrolled full-time.", + "target_collection": "Students", + "search_query": "quantum computing research interests", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "researchInterests", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 153, + "database_schema_index": 2, + "natural_language_query": "Find courses that are conceptually similar to 'machine learning', are currently enrolling, and identify the top 3 most common course titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are conceptually similar to 'machine learning', are currently enrolling, and identify the top 3 most common course titles.", + "target_collection": "Courses", + "search_query": "Find courses related to 'machine learning' that are open for enrollment", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are conceptually similar to 'machine learning', are currently enrolling, and identify the top 3 most common course titles.", + "target_collection": "Courses", + "search_query": "conceptually similar to machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currently_enrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "course_title", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": "course_title", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 154, + "database_schema_index": 2, + "natural_language_query": "Find the most relevant students based on research interests around 'machine learning', calculate the percentage of those students enrolled full-time, and group the results by their research interests.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find the most relevant students based on research interests around 'machine learning', calculate the percentage of those students enrolled full-time, and group the results by their research interests.", + "target_collection": "Students", + "search_query": "Find the most relevant students based on research interests around 'machine learning'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "enrolledFullTime", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "researchInterests" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the most relevant students based on research interests around 'machine learning', calculate the percentage of those students enrolled full-time, and group the results by their research interests.", + "target_collection": "Students", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "enrolledFullTime", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "researchInterests", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 155, + "database_schema_index": 2, + "natural_language_query": "Find the number of courses with courseTitle or courseDescription related to 'Data Science', and summarize how many of these courses are currently open for enrollment.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find the number of courses with courseTitle or courseDescription related to 'Data Science', and summarize how many of these courses are currently open for enrollment.", + "target_collection": "Courses", + "search_query": "Data Science", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 156, + "database_schema_index": 2, + "natural_language_query": "Find courses whose courseDescription is similar to 'machine learning foundations' and group these courses by their currentlyEnrolling status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses whose courseDescription is similar to 'machine learning foundations' and group these courses by their currentlyEnrolling status.", + "target_collection": "Courses", + "search_query": "Find courses whose courseDescription is similar to 'machine learning foundations'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses whose courseDescription is similar to 'machine learning foundations' and group these courses by their currentlyEnrolling status.", + "target_collection": "Courses", + "search_query": "machine learning foundations", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 157, + "database_schema_index": 2, + "natural_language_query": "Find courses with a courseDescription that covers the entire data science lifecycle, including data collection, processing, analysis, and presentation.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses with a courseDescription that covers the entire data science lifecycle, including data collection, processing, analysis, and presentation.", + "target_collection": "Courses", + "search_query": "Find courses that cover the entire data science lifecycle, including data collection, processing, analysis, and presentation.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses with a courseDescription that covers the entire data science lifecycle, including data collection, processing, analysis, and presentation.", + "target_collection": "Courses", + "search_query": "entire data science lifecycle, including data collection, processing, analysis, and presentation", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 158, + "database_schema_index": 2, + "natural_language_query": "Count the number of instructors grouped by tenured status who have at least 10 years in yearsOfTeaching.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Count the number of instructors grouped by tenured status who have at least 10 years in yearsOfTeaching.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "Count the number of instructors grouped by tenured status who have at least 10 years in yearsOfTeaching.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 159, + "database_schema_index": 2, + "natural_language_query": "Find the total number of instructors who have been teaching for at least 10 years based on their yearsOfTeaching.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find the total number of instructors who have been teaching for at least 10 years based on their yearsOfTeaching.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the total number of instructors who have been teaching for at least 10 years based on their yearsOfTeaching.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "yearsOfTeaching", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 160, + "database_schema_index": 2, + "natural_language_query": "Identify instructors who have been teaching for at least 10 years. For these instructors, summarize how frequently different words appear in their biography, and categorize them based on whether they hold tenured positions.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify instructors who have been teaching for at least 10 years. For these instructors, summarize how frequently different words appear in their biography, and categorize them based on whether they hold tenured positions.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify instructors who have been teaching for at least 10 years. For these instructors, summarize how frequently different words appear in their biography, and categorize them based on whether they hold tenured positions.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "biography", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "tenured", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 161, + "database_schema_index": 2, + "natural_language_query": "Find instructors who have at least 10 yearsOfTeaching and determine the top 5 most common attributes mentioned in their biography.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find instructors who have at least 10 yearsOfTeaching and determine the top 5 most common attributes mentioned in their biography.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "biography", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find instructors who have at least 10 yearsOfTeaching and determine the top 5 most common attributes mentioned in their biography.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "biography", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 162, + "database_schema_index": 2, + "natural_language_query": "Find all instructors with more than 5 years in yearsOfTeaching, show the count of tenured status and group the results by instructorName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find all instructors with more than 5 years in yearsOfTeaching, show the count of tenured status and group the results by instructorName.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "instructorName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all instructors with more than 5 years in yearsOfTeaching, show the count of tenured status and group the results by instructorName.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "tenured", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "instructorName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 163, + "database_schema_index": 2, + "natural_language_query": "Find courses with a courseDuration of at least 20 hours and determine how many of these are currently enrolling by counting the boolean currentlyEnrolling field.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses with a courseDuration of at least 20 hours and determine how many of these are currently enrolling by counting the boolean currentlyEnrolling field.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses with a courseDuration of at least 20 hours and determine how many of these are currently enrolling by counting the boolean currentlyEnrolling field.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 164, + "database_schema_index": 2, + "natural_language_query": "Identify instructors who have more than 10 years of teaching experience and group them by whether they hold a tenured position.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify instructors who have more than 10 years of teaching experience and group them by whether they hold a tenured position.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify instructors who have more than 10 years of teaching experience and group them by whether they hold a tenured position.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 165, + "database_schema_index": 2, + "natural_language_query": "Find courses that have a courseDuration greater than 10 hours.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that have a courseDuration greater than 10 hours.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that have a courseDuration greater than 10 hours.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 166, + "database_schema_index": 2, + "natural_language_query": "Find all courses containing 'machine learning' in the courseDescription, then group them by currentlyEnrolling status and determine the maximum courseDuration in each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find all courses containing 'machine learning' in the courseDescription, then group them by currentlyEnrolling status and determine the maximum courseDuration in each group.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "machine learning" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all courses containing 'machine learning' in the courseDescription, then group them by currentlyEnrolling status and determine the maximum courseDuration in each group.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 167, + "database_schema_index": 2, + "natural_language_query": "Find the average courseDuration of all courses that have 'Python' in their courseDescription.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find the average courseDuration of all courses that have 'Python' in their courseDescription.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "Python" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the average courseDuration of all courses that have 'Python' in their courseDescription.", + "target_collection": "Courses", + "search_query": "Python", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 168, + "database_schema_index": 2, + "natural_language_query": "Identify whether courses that mention 'machine learning' in their courseDescription are currently enrolling, group these courses by their currentlyEnrolling status, and list the top 5 most common courseTitles for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify whether courses that mention 'machine learning' in their courseDescription are currently enrolling, group these courses by their currentlyEnrolling status, and list the top 5 most common courseTitles for each group.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "machine learning" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify whether courses that mention 'machine learning' in their courseDescription are currently enrolling, group these courses by their currentlyEnrolling status, and list the top 5 most common courseTitles for each group.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 169, + "database_schema_index": 2, + "natural_language_query": "Find and count courses with 'data science' in the courseDescription by using the courseDescription text_property_filter with LIKE, and count the total number of different course titles using courseTitle text_property_aggregation COUNT.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find and count courses with 'data science' in the courseDescription by using the courseDescription text_property_filter with LIKE, and count the total number of different course titles using courseTitle text_property_aggregation COUNT.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "data science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find and count courses with 'data science' in the courseDescription by using the courseDescription text_property_filter with LIKE, and count the total number of different course titles using courseTitle text_property_aggregation COUNT.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "data science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 170, + "database_schema_index": 2, + "natural_language_query": "Identify all courses that include 'Data Science' in their courseTitle, count how many of these courses are currentlyEnrolling, and group the results by courseDuration to show how courses of different durations are distributed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify all courses that include 'Data Science' in their courseTitle, count how many of these courses are currentlyEnrolling, and group the results by courseDuration to show how courses of different durations are distributed.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Data Science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify all courses that include 'Data Science' in their courseTitle, count how many of these courses are currentlyEnrolling, and group the results by courseDuration to show how courses of different durations are distributed.", + "target_collection": "Courses", + "search_query": "Data Science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 171, + "database_schema_index": 2, + "natural_language_query": "Find courses where the courseTitle contains 'Advanced' and calculate the percentage of these that are currentlyEnrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses where the courseTitle contains 'Advanced' and calculate the percentage of these that are currentlyEnrolling.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Advanced" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses where the courseTitle contains 'Advanced' and calculate the percentage of these that are currentlyEnrolling.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "%Advanced%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 172, + "database_schema_index": 2, + "natural_language_query": "Find courses containing 'Introduction to Data Science' in the courseTitle, and group the results by currentlyEnrolling status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses containing 'Introduction to Data Science' in the courseTitle, and group the results by currentlyEnrolling status.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Introduction to Data Science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses containing 'Introduction to Data Science' in the courseTitle, and group the results by currentlyEnrolling status.", + "target_collection": "Courses", + "search_query": "Introduction to Data Science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 173, + "database_schema_index": 2, + "natural_language_query": "Find courses where the courseDescription includes the phrase 'machine learning'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses where the courseDescription includes the phrase 'machine learning'.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "machine learning" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses where the courseDescription includes the phrase 'machine learning'.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 174, + "database_schema_index": 2, + "natural_language_query": "Find courses that are currently enrolling and group them by courseTitle, calculating the total sum of courseDuration for each courseTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are currently enrolling and group them by courseTitle, calculating the total sum of courseDuration for each courseTitle.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are currently enrolling and group them by courseTitle, calculating the total sum of courseDuration for each courseTitle.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 175, + "database_schema_index": 2, + "natural_language_query": "What is the total number of hours required to complete all courses that are currently open for enrollment?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the total number of hours required to complete all courses that are currently open for enrollment?", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the total number of hours required to complete all courses that are currently open for enrollment?", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openForEnrollment", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "durationHours", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9, + "error": null + }, + { + "query_index": 176, + "database_schema_index": 2, + "natural_language_query": "Identify courses that are currently open for enrollment (using currentlyEnrolling = true), and group them by courseDuration while aggregating the top 5 most common courseTitle values.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify courses that are currently open for enrollment (using currentlyEnrolling = true), and group them by courseDuration while aggregating the top 5 most common courseTitle values.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify courses that are currently open for enrollment (using currentlyEnrolling = true), and group them by courseDuration while aggregating the top 5 most common courseTitle values.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 177, + "database_schema_index": 2, + "natural_language_query": "Retrieve courses that are currentlyEnrolling and count the number of unique courseTitle entries to understand how many different courses are currently open for enrollment.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Retrieve courses that are currentlyEnrolling and count the number of unique courseTitle entries to understand how many different courses are currently open for enrollment.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve courses that are currentlyEnrolling and count the number of unique courseTitle entries to understand how many different courses are currently open for enrollment.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 178, + "database_schema_index": 2, + "natural_language_query": "Find courses where currentlyEnrolling is true, calculate the percentage of such courses, and group the results by courseTitle to see enrollment status per course.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses where currentlyEnrolling is true, calculate the percentage of such courses, and group the results by courseTitle to see enrollment status per course.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses where currentlyEnrolling is true, calculate the percentage of such courses, and group the results by courseTitle to see enrollment status per course.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 179, + "database_schema_index": 2, + "natural_language_query": "Find all courses that are currently open for enrollment and calculate the total number of courses where the currentlyEnrolling property is true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find all courses that are currently open for enrollment and calculate the total number of courses where the currentlyEnrolling property is true.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all courses that are currently open for enrollment and calculate the total number of courses where the currentlyEnrolling property is true.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 180, + "database_schema_index": 2, + "natural_language_query": "Find all course titles where courses are currently enrolling and group the results by course title.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find all course titles where courses are currently enrolling and group the results by course title.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all course titles where courses are currently enrolling and group the results by course title.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 181, + "database_schema_index": 2, + "natural_language_query": "Find courses where currentlyEnrolling is true", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses where currentlyEnrolling is true", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses where currentlyEnrolling is true", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 182, + "database_schema_index": 2, + "natural_language_query": "What is the average yearsOfTeaching of instructors, grouped by their tenured status?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average yearsOfTeaching of instructors, grouped by their tenured status?", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfTeaching", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average yearsOfTeaching of instructors, grouped by their tenured status?", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfTeaching", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 183, + "database_schema_index": 2, + "natural_language_query": "What is the average and maximum number of years instructors have been teaching in the yearsOfTeaching property of the Instructors collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average and maximum number of years instructors have been teaching in the yearsOfTeaching property of the Instructors collection?", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfTeaching", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average and maximum number of years instructors have been teaching in the yearsOfTeaching property of the Instructors collection?", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfTeaching", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 184, + "database_schema_index": 2, + "natural_language_query": "What is the count of each unique courseTitle for Courses, grouped by their currentlyEnrolling status?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the count of each unique courseTitle for Courses, grouped by their currentlyEnrolling status?", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the count of each unique courseTitle for Courses, grouped by their currentlyEnrolling status?", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 185, + "database_schema_index": 2, + "natural_language_query": "Count unique courseTitle values and find the top 5 most common course titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Count unique courseTitle values and find the top 5 most common course titles.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Count unique courseTitle values and find the top 5 most common course titles.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 186, + "database_schema_index": 2, + "natural_language_query": "What percentage of courses are currently open for enrollment and how are these courses grouped by course duration?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What percentage of courses are currently open for enrollment and how are these courses grouped by course duration?", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "What percentage of courses are currently open for enrollment and how are these courses grouped by course duration?", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 187, + "database_schema_index": 2, + "natural_language_query": "Calculate how many courses in the Courses collection are currently open for enrollment, and determine the percentage of courses that are currently enrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Calculate how many courses in the Courses collection are currently open for enrollment, and determine the percentage of courses that are currently enrolling.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate how many courses in the Courses collection are currently open for enrollment, and determine the percentage of courses that are currently enrolling.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 188, + "database_schema_index": 2, + "natural_language_query": "What is the average years of teaching for instructors grouped by their tenured status using groupby on tenured?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average years of teaching for instructors grouped by their tenured status using groupby on tenured?", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average years of teaching for instructors grouped by their tenured status using groupby on tenured?", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfTeaching", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 189, + "database_schema_index": 2, + "natural_language_query": "What is the average packagePrice of travel packages whose packageDetails correspond to 'tropical beach relaxation' and have a price less than $1500, grouped by whether a discount is available?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the average packagePrice of travel packages whose packageDetails correspond to 'tropical beach relaxation' and have a price less than $1500, grouped by whether a discount is available?", + "target_collection": "TravelPackages", + "search_query": "Find travel packages whose packageDetails match 'tropical beach relaxation'", + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average packagePrice of travel packages whose packageDetails correspond to 'tropical beach relaxation' and have a price less than $1500, grouped by whether a discount is available?", + "target_collection": "Travel_packages", + "search_query": "tropical beach relaxation", + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 190, + "database_schema_index": 2, + "natural_language_query": "Find travel destinations that are related to exotic beaches and vibrant nightlife but have an averageVisitCost of no more than $1500. Additionally, determine the maximum averageVisitCost among destinations that are popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are related to exotic beaches and vibrant nightlife but have an averageVisitCost of no more than $1500. Additionally, determine the maximum averageVisitCost among destinations that are popular.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations related to exotic beaches and vibrant nightlife from destinationDescription", + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are related to exotic beaches and vibrant nightlife but have an averageVisitCost of no more than $1500. Additionally, determine the maximum averageVisitCost among destinations that are popular.", + "target_collection": "TravelDestinations", + "search_query": "exotic beaches and vibrant nightlife", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 191, + "database_schema_index": 2, + "natural_language_query": "Find destinations where the description includes 'hot and sunny beaches with vibrant nightlife', the averageVisitCost is less than or equal to 1500, count how many destinations are popular, and group the results by destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations where the description includes 'hot and sunny beaches with vibrant nightlife', the averageVisitCost is less than or equal to 1500, count how many destinations are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "hot and sunny beaches with vibrant nightlife", + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find destinations where the description includes 'hot and sunny beaches with vibrant nightlife', the averageVisitCost is less than or equal to 1500, count how many destinations are popular, and group the results by destinationName.", + "target_collection": "Destinations", + "search_query": "hot and sunny beaches with vibrant nightlife", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 192, + "database_schema_index": 3, + "natural_language_query": "Find travel packages that include safaris and beaches with a packagePrice less than 1000. Also, count how many times each packageName appears in the results.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages that include safaris and beaches with a packagePrice less than 1000. Also, count how many times each packageName appears in the results.", + "target_collection": "TravelPackages", + "search_query": "Find travel packages that include safaris and beaches", + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<", + "value": 1000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages that include safaris and beaches with a packagePrice less than 1000. Also, count how many times each packageName appears in the results.", + "target_collection": "TravelPackages", + "search_query": "safaris and beaches", + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<", + "value": 1000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "packageName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 193, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that offer peaceful beach vacations, where the averageVisitCost is less than or equal to 1500, count how many of these are popular, and group the results by destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that offer peaceful beach vacations, where the averageVisitCost is less than or equal to 1500, count how many of these are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations that offer peaceful beach vacations", + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that offer peaceful beach vacations, where the averageVisitCost is less than or equal to 1500, count how many of these are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "peaceful beach vacations", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 194, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations with beautiful beaches and rich cultural experiences where the averageVisitCost is no more than 1500, and determine what percentage of these destinations are currently popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations with beautiful beaches and rich cultural experiences where the averageVisitCost is no more than 1500, and determine what percentage of these destinations are currently popular.", + "target_collection": "TravelDestinations", + "search_query": "I want to find travel destinations with beautiful beaches and rich cultural experiences.", + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations with beautiful beaches and rich cultural experiences where the averageVisitCost is no more than 1500, and determine what percentage of these destinations are currently popular.", + "target_collection": "TravelDestinations", + "search_query": "beautiful beaches and rich cultural experiences", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyPopular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 195, + "database_schema_index": 3, + "natural_language_query": "Search for a relaxing vacation package that includes beach activities and cultural tours, filter for packages with a packagePrice greater than 2000, and organize the results based on whether a discount is available, using discountAvailable as the grouping property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Search for a relaxing vacation package that includes beach activities and cultural tours, filter for packages with a packagePrice greater than 2000, and organize the results based on whether a discount is available, using discountAvailable as the grouping property.", + "target_collection": "TravelPackages", + "search_query": "A relaxing vacation package with beach activities and cultural tours", + "integer_property_filter": { + "property_name": "packagePrice", + "operator": ">", + "value": 2000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for a relaxing vacation package that includes beach activities and cultural tours, filter for packages with a packagePrice greater than 2000, and organize the results based on whether a discount is available, using discountAvailable as the grouping property.", + "target_collection": "VacationPackages", + "search_query": "relaxing vacation package that includes beach activities and cultural tours", + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": ">", + "value": 2000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 196, + "database_schema_index": 3, + "natural_language_query": "Find travel packages described as a 'relaxing beach holiday' with a packagePrice of at most $500.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages described as a 'relaxing beach holiday' with a packagePrice of at most $500.", + "target_collection": "TravelPackages", + "search_query": "Find travel packages described as a 'relaxing beach holiday'.", + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<=", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages described as a 'relaxing beach holiday' with a packagePrice of at most $500.", + "target_collection": "TravelPackages", + "search_query": "relaxing beach holiday", + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<=", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 197, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations with descriptions similar to 'beach and cultural experiences', filter for destinations named Bali, calculate the average of averageVisitCost, and group by whether destinations are popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations with descriptions similar to 'beach and cultural experiences', filter for destinations named Bali, calculate the average of averageVisitCost, and group by whether destinations are popular.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations with descriptions similar to 'beach and cultural experiences'", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "=", + "value": "Bali" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations with descriptions similar to 'beach and cultural experiences', filter for destinations named Bali, calculate the average of averageVisitCost, and group by whether destinations are popular.", + "target_collection": "TravelDestinations", + "search_query": "beach and cultural experiences", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Bali" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 198, + "database_schema_index": 3, + "natural_language_query": "Find destinations whose descriptions semantically emphasize beautiful landscapes, specifically retrieve destinations named \"Bora Bora\", and determine the maximum average visit cost among all destinations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations whose descriptions semantically emphasize beautiful landscapes, specifically retrieve destinations named \"Bora Bora\", and determine the maximum average visit cost among all destinations.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations with descriptions that emphasize beautiful landscapes", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "=", + "value": "Bora Bora" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find destinations whose descriptions semantically emphasize beautiful landscapes, specifically retrieve destinations named \"Bora Bora\", and determine the maximum average visit cost among all destinations.", + "target_collection": "Destinations", + "search_query": "beautiful landscapes", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Bora Bora" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 199, + "database_schema_index": 3, + "natural_language_query": "Find the most frequently occurring travel destinations that are popular among tourists, and match the phrase 'tropical beaches with vibrant nightlife', grouping them by their names and aggregating the count of each destination name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find the most frequently occurring travel destinations that are popular among tourists, and match the phrase 'tropical beaches with vibrant nightlife', grouping them by their names and aggregating the count of each destination name.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match the phrase 'tropical beaches with vibrant nightlife'", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "popular", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the most frequently occurring travel destinations that are popular among tourists, and match the phrase 'tropical beaches with vibrant nightlife', grouping them by their names and aggregating the count of each destination name.", + "target_collection": "Travel_destinations", + "search_query": "tropical beaches with vibrant nightlife", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 200, + "database_schema_index": 3, + "natural_language_query": "Find destinations with tropical experiences as described in the destinationDescription, locate destinations that have 'Beach' included in the destinationName, and count how many destinations are currently marked as popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations with tropical experiences as described in the destinationDescription, locate destinations that have 'Beach' included in the destinationName, and count how many destinations are currently marked as popular.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations with tropical experiences in destinationDescription", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "Beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find destinations with tropical experiences as described in the destinationDescription, locate destinations that have 'Beach' included in the destinationName, and count how many destinations are currently marked as popular.", + "target_collection": "Destinations", + "search_query": "tropical experiences", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "%Beach%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isPopular", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 201, + "database_schema_index": 3, + "natural_language_query": "Find destinations with a description similar to 'scenic views', filter those with 'island' in their destinationName, group results by destinationName, and calculate the percentage of popular destinations within each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations with a description similar to 'scenic views', filter those with 'island' in their destinationName, group results by destinationName, and calculate the percentage of popular destinations within each group.", + "target_collection": "TravelDestinations", + "search_query": "scenic views", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "%island%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find destinations with a description similar to 'scenic views', filter those with 'island' in their destinationName, group results by destinationName, and calculate the percentage of popular destinations within each group.", + "target_collection": "Destinations", + "search_query": "scenic views", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "%island%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 202, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that are relevant to a charming winter holiday experience with various activities. Additionally, filter results to include only destinations named 'Swiss Alps', and count how many of these destinations are currently popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are relevant to a charming winter holiday experience with various activities. Additionally, filter results to include only destinations named 'Swiss Alps', and count how many of these destinations are currently popular.", + "target_collection": "TravelDestinations", + "search_query": "I am looking for a charming winter holiday experience with various activities.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "=", + "value": "Swiss Alps" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are relevant to a charming winter holiday experience with various activities. Additionally, filter results to include only destinations named 'Swiss Alps', and count how many of these destinations are currently popular.", + "target_collection": "TravelDestinations", + "search_query": "charming winter holiday experience with various activities", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Swiss Alps" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isPopular", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 203, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that offer a cultural experience in their description, include 'Paris' in the destination name, and group the results by whether they are currently popular among tourists.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that offer a cultural experience in their description, include 'Paris' in the destination name, and group the results by whether they are currently popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": "A cultural experience", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "%Paris%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that offer a cultural experience in their description, include 'Paris' in the destination name, and group the results by whether they are currently popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": "cultural experience in description", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "%Paris%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isPopularAmongTourists", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 204, + "database_schema_index": 3, + "natural_language_query": "Find travel packages that are conceptually similar to a relaxing beach vacation and have 'Caribbean' in the packageName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages that are conceptually similar to a relaxing beach vacation and have 'Caribbean' in the packageName.", + "target_collection": "TravelPackages", + "search_query": "relaxing beach vacation", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "packageName", + "operator": "LIKE", + "value": "Caribbean" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages that are conceptually similar to a relaxing beach vacation and have 'Caribbean' in the packageName.", + "target_collection": "TravelPackages", + "search_query": "relaxing beach vacation", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "packageName", + "operator": "LIKE", + "value": "%Caribbean%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 205, + "database_schema_index": 3, + "natural_language_query": "Search for travel destinations with scenic beaches and vibrant local culture, filter for those that are currently popular, calculate the average cost to visit, and group by destination name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Search for travel destinations with scenic beaches and vibrant local culture, filter for those that are currently popular, calculate the average cost to visit, and group by destination name.", + "target_collection": "TravelDestinations", + "search_query": "Scenic beaches with vibrant local culture", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for travel destinations with scenic beaches and vibrant local culture, filter for those that are currently popular, calculate the average cost to visit, and group by destination name.", + "target_collection": "Travel_destinations", + "search_query": "scenic beaches and vibrant local culture", + "limit": 5, + "integer_property_filter": { + "property_name": "popularity", + "operator": ">", + "value": 0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "average_cost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destination_name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 206, + "database_schema_index": 3, + "natural_language_query": "Identify popular travel destinations described as tropical beaches and places with rich cultural history, and compute the average cost of visiting these popular locations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Identify popular travel destinations described as tropical beaches and places with rich cultural history, and compute the average cost of visiting these popular locations.", + "target_collection": "TravelDestinations", + "search_query": "Find tropical beaches and cultural destinations with rich histories.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify popular travel destinations described as tropical beaches and places with rich cultural history, and compute the average cost of visiting these popular locations.", + "target_collection": "TravelDestinations", + "search_query": "tropical beaches rich cultural history", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 207, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations related to beach vacations that are popular, categorize them by destinationName, and identify the top 5 most common destination names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations related to beach vacations that are popular, categorize them by destinationName, and identify the top 5 most common destination names.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations related to beach vacations", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations related to beach vacations that are popular, categorize them by destinationName, and identify the top 5 most common destination names.", + "target_collection": "TravelDestinations", + "search_query": "beach vacations", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 208, + "database_schema_index": 3, + "natural_language_query": "Find the most relevant travel destinations with scenic beaches and vibrant nightlife among those that are currently popular, and count how many travel destinations are there.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find the most relevant travel destinations with scenic beaches and vibrant nightlife among those that are currently popular, and count how many travel destinations are there.", + "target_collection": "TravelDestinations", + "search_query": "description: 'Describe destinations with scenic beaches and vibrant nightlife'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 209, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that match 'tropical beaches with vibrant cultures' in their destinationDescription, filter them to show only those that are currently popular, calculate the percentage of destinations that are popular, and group the results by destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that match 'tropical beaches with vibrant cultures' in their destinationDescription, filter them to show only those that are currently popular, calculate the percentage of destinations that are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match 'tropical beaches with vibrant cultures' in destinationDescription", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that match 'tropical beaches with vibrant cultures' in their destinationDescription, filter them to show only those that are currently popular, calculate the percentage of destinations that are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "tropical beaches with vibrant cultures", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isPopular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isPopular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9, + "error": null + }, + { + "query_index": 210, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations with sunny beaches and vibrant nightlife, filter for where they are currently popular, and count these popular destinations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations with sunny beaches and vibrant nightlife, filter for where they are currently popular, and count these popular destinations.", + "target_collection": "TravelDestinations", + "search_query": "sunny beaches and vibrant nightlife", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations with sunny beaches and vibrant nightlife, filter for where they are currently popular, and count these popular destinations.", + "target_collection": "TravelDestinations", + "search_query": "sunny beaches and vibrant nightlife", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyPopular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPopular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 211, + "database_schema_index": 3, + "natural_language_query": "Find popular travel destinations with descriptions that include scenic vistas and vibrant cultures, and group these destinations by their destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find popular travel destinations with descriptions that include scenic vistas and vibrant cultures, and group these destinations by their destinationName.", + "target_collection": "TravelDestinations", + "search_query": "Explore scenic vistas and vibrant cultures", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find popular travel destinations with descriptions that include scenic vistas and vibrant cultures, and group these destinations by their destinationName.", + "target_collection": "TravelDestinations", + "search_query": "scenic vistas and vibrant cultures", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 212, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that are popular and include descriptions related to 'tropical beaches and adventure sports'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are popular and include descriptions related to 'tropical beaches and adventure sports'.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that include descriptions related to 'tropical beaches and adventure sports' within the destinationDescription.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are popular and include descriptions related to 'tropical beaches and adventure sports'.", + "target_collection": "TravelDestinations", + "search_query": "tropical beaches and adventure sports", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 213, + "database_schema_index": 3, + "natural_language_query": "Identify travel packages providing a relaxing beach holiday (using search_query on packageDetails). Within these, calculate the average packagePrice (using int_property_aggregation on packagePrice), and group the results by whether there is a discountAvailable (using groupby on discountAvailable).", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Identify travel packages providing a relaxing beach holiday (using search_query on packageDetails). Within these, calculate the average packagePrice (using int_property_aggregation on packagePrice), and group the results by whether there is a discountAvailable (using groupby on discountAvailable).", + "target_collection": "TravelPackages", + "search_query": "Find travel packages that offer a relaxing beach holiday", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify travel packages providing a relaxing beach holiday (using search_query on packageDetails). Within these, calculate the average packagePrice (using int_property_aggregation on packagePrice), and group the results by whether there is a discountAvailable (using groupby on discountAvailable).", + "target_collection": "Packages", + "search_query": "relaxing beach holiday", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 214, + "database_schema_index": 3, + "natural_language_query": "What is the average cost of visiting tropical beach resorts described in detail?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the average cost of visiting tropical beach resorts described in detail?", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match the detailed description of tropical beach resorts.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average cost of visiting tropical beach resorts described in detail?", + "target_collection": "Visiting_Tropical_Beach_Resorts", + "search_query": "tropical beach resorts", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "cost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 215, + "database_schema_index": 3, + "natural_language_query": "List travel destinations matching a description of 'tropical beaches', count the different destination names, and group results by whether they are popular to see which group has more destinations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "List travel destinations matching a description of 'tropical beaches', count the different destination names, and group results by whether they are popular to see which group has more destinations.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that best match the description 'tropical beaches'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "List travel destinations matching a description of 'tropical beaches', count the different destination names, and group results by whether they are popular to see which group has more destinations.", + "target_collection": "Destinations", + "search_query": "tropical beaches", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 216, + "database_schema_index": 3, + "natural_language_query": "Find destinations that are conceptually similar to 'romantic getaway with beach access', and also list the top 5 most common destination names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations that are conceptually similar to 'romantic getaway with beach access', and also list the top 5 most common destination names.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations that are conceptually similar to 'romantic getaway with beach access'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find destinations that are conceptually similar to 'romantic getaway with beach access', and also list the top 5 most common destination names.", + "target_collection": "Destinations", + "search_query": "romantic getaway with beach access", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 217, + "database_schema_index": 3, + "natural_language_query": "What percentage of destinations, grouped by destination names, are popular among tourists, and which of these have similar descriptions to 'romantic beaches with vibrant nightlife'? Please find matching entries using semantic search, and analyze the proportion of those considered popular using boolean property aggregation for the 'popular' field.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What percentage of destinations, grouped by destination names, are popular among tourists, and which of these have similar descriptions to 'romantic beaches with vibrant nightlife'? Please find matching entries using semantic search, and analyze the proportion of those considered popular using boolean property aggregation for the 'popular' field.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations similar to 'romantic beaches with vibrant nightlife.'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "What percentage of destinations, grouped by destination names, are popular among tourists, and which of these have similar descriptions to 'romantic beaches with vibrant nightlife'? Please find matching entries using semantic search, and analyze the proportion of those considered popular using boolean property aggregation for the 'popular' field.", + "target_collection": "Destinations", + "search_query": "romantic beaches with vibrant nightlife", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 218, + "database_schema_index": 3, + "natural_language_query": "What percentage of travel destinations, that match snowy mountains and vibrant city life descriptions, are currently popular among tourists?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What percentage of travel destinations, that match snowy mountains and vibrant city life descriptions, are currently popular among tourists?", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match descriptions of snowy mountains and vibrant city life.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What percentage of travel destinations, that match snowy mountains and vibrant city life descriptions, are currently popular among tourists?", + "target_collection": "TravelDestinations", + "search_query": "snowy mountains and vibrant city life", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popularAmongTourists", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 219, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that match the theme 'tropical beach with vibrant nightlife', and group the results based on whether they are popular among tourists.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that match the theme 'tropical beach with vibrant nightlife', and group the results based on whether they are popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match the query \"tropical beach with vibrant nightlife\".", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that match the theme 'tropical beach with vibrant nightlife', and group the results based on whether they are popular among tourists.", + "target_collection": "Travel_destinations", + "search_query": "tropical beach with vibrant nightlife", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popularAmongTourists", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 220, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that are conceptually similar to 'romantic nature getaways' based on the destinationDescription.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are conceptually similar to 'romantic nature getaways' based on the destinationDescription.", + "target_collection": "TravelDestinations", + "search_query": "{\"destinationDescription\":{\"operator\":\"search_query\",\"value\":\"romantic nature getaways\"}}", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are conceptually similar to 'romantic nature getaways' based on the destinationDescription.", + "target_collection": "Destinations", + "search_query": "romantic nature getaways", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 221, + "database_schema_index": 3, + "natural_language_query": "Count how many travel agents have more than 5 years of experience, and group them by their agentName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Count how many travel agents have more than 5 years of experience, and group them by their agentName.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "agentName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Count how many travel agents have more than 5 years of experience, and group them by their agentName.", + "target_collection": "Travel_agents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "experienceYears", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "agentName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 222, + "database_schema_index": 3, + "natural_language_query": "Find travel agents who have at least 10 years in yearsOfExperience and determine the average years of experience among all travel agents.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel agents who have at least 10 years in yearsOfExperience and determine the average years of experience among all travel agents.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel agents who have at least 10 years in yearsOfExperience and determine the average years of experience among all travel agents.", + "target_collection": "Travel_agents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 223, + "database_schema_index": 3, + "natural_language_query": "Find travel agents who have at least 5 years in yearsOfExperience, count how many travel agents share the same agentName, and categorize the results based on whether they are availableNow.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel agents who have at least 5 years in yearsOfExperience, count how many travel agents share the same agentName, and categorize the results based on whether they are availableNow.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "availableNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel agents who have at least 5 years in yearsOfExperience, count how many travel agents share the same agentName, and categorize the results based on whether they are availableNow.", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "agentName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "availableNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 224, + "database_schema_index": 3, + "natural_language_query": "Show all travel agents with at least 5 years of experience and count the number of unique agentName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Show all travel agents with at least 5 years of experience and count the number of unique agentName.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Show all travel agents with at least 5 years of experience and count the number of unique agentName.", + "target_collection": "Travel Agents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "agentName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 225, + "database_schema_index": 3, + "natural_language_query": "Find travel packages that cost no more than 2000 in packagePrice, group these results by packageName, and count the total number of packages with discounts by evaluating discountAvailable.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages that cost no more than 2000 in packagePrice, group these results by packageName, and count the total number of packages with discounts by evaluating discountAvailable.", + "target_collection": "TravelPackages", + "search_query": null, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<=", + "value": 2000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "packageName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages that cost no more than 2000 in packagePrice, group these results by packageName, and count the total number of packages with discounts by evaluating discountAvailable.", + "target_collection": "Travel_packages", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<=", + "value": 2000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "discountAvailable", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "packageName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 226, + "database_schema_index": 3, + "natural_language_query": "Find travel agents with at least 5 years of experience and count how many are available now.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel agents with at least 5 years of experience and count how many are available now.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel agents with at least 5 years of experience and count how many are available now.", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "availableNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 227, + "database_schema_index": 3, + "natural_language_query": "Group travel agents by their yearsOfExperience and only include those that have more than 5 years in yearsOfExperience.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Group travel agents by their yearsOfExperience and only include those that have more than 5 years in yearsOfExperience.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "yearsOfExperience" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group travel agents by their yearsOfExperience and only include those that have more than 5 years in yearsOfExperience.", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "yearsOfExperience", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 228, + "database_schema_index": 3, + "natural_language_query": "Find travel agents with at least 5 years of experience in yearsOfExperience.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel agents with at least 5 years of experience in yearsOfExperience.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel agents with at least 5 years of experience in yearsOfExperience.", + "target_collection": "Travel_agents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 229, + "database_schema_index": 3, + "natural_language_query": "Find travel packages where the packageDetails include the keyword 'luxury', then compute the average of packagePrice for packages where discountAvailable is true, and group the results based on whether a discount is available.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages where the packageDetails include the keyword 'luxury', then compute the average of packagePrice for packages where discountAvailable is true, and group the results based on whether a discount is available.", + "target_collection": "TravelPackages", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "packageDetails", + "operator": "LIKE", + "value": "luxury" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages where the packageDetails include the keyword 'luxury', then compute the average of packagePrice for packages where discountAvailable is true, and group the results based on whether a discount is available.", + "target_collection": "TravelPackages", + "search_query": "luxury", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 230, + "database_schema_index": 3, + "natural_language_query": "Determine the average averageVisitCost for travel destinations where destinationDescription contains the keyword 'beach'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Determine the average averageVisitCost for travel destinations where destinationDescription contains the keyword 'beach'.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Determine the average averageVisitCost for travel destinations where destinationDescription contains the keyword 'beach'.", + "target_collection": "Travel destinations", + "search_query": "beach", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 231, + "database_schema_index": 3, + "natural_language_query": "List all travel destinations where the destinationDescription mentions 'popular', count how many destinations have such a description, and group these results by destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "List all travel destinations where the destinationDescription mentions 'popular', count how many destinations have such a description, and group these results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "%popular%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "List all travel destinations where the destinationDescription mentions 'popular', count how many destinations have such a description, and group these results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "popular", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 232, + "database_schema_index": 3, + "natural_language_query": "Find all destinations in TravelDestinations where the destinationDescription contains the word 'beach', and count how many such destinations exist.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find all destinations in TravelDestinations where the destinationDescription contains the word 'beach', and count how many such destinations exist.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "%beach%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 233, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations where the destinationDescription includes 'beach', group the results by destinationName and count how many of these destinations are popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations where the destinationDescription includes 'beach', group the results by destinationName and count how many of these destinations are popular.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations where the destinationDescription includes 'beach', group the results by destinationName and count how many of these destinations are popular.", + "target_collection": "Travel_destinations", + "search_query": "beach", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 234, + "database_schema_index": 3, + "natural_language_query": "Show me travel destinations that include 'Beach' in their destinationName and count how many of them are popular using the popular attribute.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Show me travel destinations that include 'Beach' in their destinationName and count how many of them are popular using the popular attribute.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "Beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Show me travel destinations that include 'Beach' in their destinationName and count how many of them are popular using the popular attribute.", + "target_collection": "Travel Destinations", + "search_query": "Beach", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 235, + "database_schema_index": 3, + "natural_language_query": "Find all travel destinations where the destinationDescription contains the keyword 'beach', and group the results by whether or not the destination is popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find all travel destinations where the destinationDescription contains the keyword 'beach', and group the results by whether or not the destination is popular.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all travel destinations where the destinationDescription contains the keyword 'beach', and group the results by whether or not the destination is popular.", + "target_collection": "Travel_destinations", + "search_query": "beach", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isPopular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 236, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations with descriptions that contain the keyword 'beaches' in destinationDescription.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations with descriptions that contain the keyword 'beaches' in destinationDescription.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "beaches" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations with descriptions that contain the keyword 'beaches' in destinationDescription.", + "target_collection": "TravelDestinations", + "search_query": "beaches", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 237, + "database_schema_index": 3, + "natural_language_query": "Find the average cost of all travel destinations that are popular, and group the results by each destination name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find the average cost of all travel destinations that are popular, and group the results by each destination name.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the average cost of all travel destinations that are popular, and group the results by each destination name.", + "target_collection": "Travel_destinations", + "search_query": "popular", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "cost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destination_name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 238, + "database_schema_index": 3, + "natural_language_query": "Find the total sum of packagePrice for all travel packages where discountAvailable is true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find the total sum of packagePrice for all travel packages where discountAvailable is true.", + "target_collection": "TravelPackages", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the total sum of packagePrice for all travel packages where discountAvailable is true.", + "target_collection": "Travel packages", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 239, + "database_schema_index": 3, + "natural_language_query": "List and categorize all popular travel destinations by their names, and for each destination, count the number of detailed descriptions available, ensuring that only destinations currently popular among tourists are included.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "List and categorize all popular travel destinations by their names, and for each destination, count the number of detailed descriptions available, ensuring that only destinations currently popular among tourists are included.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "List and categorize all popular travel destinations by their names, and for each destination, count the number of detailed descriptions available, ensuring that only destinations currently popular among tourists are included.", + "target_collection": "TravelDestinations", + "search_query": "popular travel destinations", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 240, + "database_schema_index": 3, + "natural_language_query": "Retrieve destinations with destinationName that are currently popular, then count the number of unique destinationName values.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Retrieve destinations with destinationName that are currently popular, then count the number of unique destinationName values.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve destinations with destinationName that are currently popular, then count the number of unique destinationName values.", + "target_collection": "Destinations", + "search_query": "currently popular", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 241, + "database_schema_index": 3, + "natural_language_query": "Find me all travel packages where there is a discountAvailable, count how many packages have a discount and organize the results by packageName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find me all travel packages where there is a discountAvailable, count how many packages have a discount and organize the results by packageName.", + "target_collection": "TravelPackages", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "packageName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find me all travel packages where there is a discountAvailable, count how many packages have a discount and organize the results by packageName.", + "target_collection": "TravelPackages", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "discountAvailable", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "packageName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 242, + "database_schema_index": 3, + "natural_language_query": "Find all travel destinations where the destination is currently popular, and calculate the percentage of all travel destinations that are popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find all travel destinations where the destination is currently popular, and calculate the percentage of all travel destinations that are popular.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all travel destinations where the destination is currently popular, and calculate the percentage of all travel destinations that are popular.", + "target_collection": "Travel Destinations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 243, + "database_schema_index": 3, + "natural_language_query": "Find popular travel destinations, where 'popular' equals true, and group results by 'destinationName'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find popular travel destinations, where 'popular' equals true, and group results by 'destinationName'.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find popular travel destinations, where 'popular' equals true, and group results by 'destinationName'.", + "target_collection": "Travel_destinations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 244, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that are popular among tourists.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": "popular among tourists", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 245, + "database_schema_index": 3, + "natural_language_query": "Count the number of travel agents grouped by their availability status, using the yearsOfExperience property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Count the number of travel agents grouped by their availability status, using the yearsOfExperience property.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "availableNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Count the number of travel agents grouped by their availability status, using the yearsOfExperience property.", + "target_collection": "Travel agents", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "availabilityStatus", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 246, + "database_schema_index": 3, + "natural_language_query": "What is the average yearsOfExperience for all travel agents in the TravelAgents collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the average yearsOfExperience for all travel agents in the TravelAgents collection?", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average yearsOfExperience for all travel agents in the TravelAgents collection?", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 247, + "database_schema_index": 3, + "natural_language_query": "What is the count of each travel destination name grouped by whether the destination is popular?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the count of each travel destination name grouped by whether the destination is popular?", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the count of each travel destination name grouped by whether the destination is popular?", + "target_collection": "Travel_destinations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "popular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 248, + "database_schema_index": 3, + "natural_language_query": "What is the most common destination name in the Travel Destinations collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the most common destination name in the Travel Destinations collection?", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the most common destination name in the Travel Destinations collection?", + "target_collection": "Travel Destinations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 249, + "database_schema_index": 3, + "natural_language_query": "Show the percentage of popular destinations for each destinationName by grouping the destinations and calculating how many are marked as popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Show the percentage of popular destinations for each destinationName by grouping the destinations and calculating how many are marked as popular.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show the percentage of popular destinations for each destinationName by grouping the destinations and calculating how many are marked as popular.", + "target_collection": "Destinations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 250, + "database_schema_index": 3, + "natural_language_query": "Count how many travel destinations are currently popular and calculate the percentage of popular destinations in the TravelDestinations collection.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Count how many travel destinations are currently popular and calculate the percentage of popular destinations in the TravelDestinations collection.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Count how many travel destinations are currently popular and calculate the percentage of popular destinations in the TravelDestinations collection.", + "target_collection": "TravelDestinations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isPopular", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "isPopular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 251, + "database_schema_index": 3, + "natural_language_query": "Group all travel destinations by the boolean property popular and determine the averageVisitCost for each group to understand the cost difference between popular and non-popular destinations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Group all travel destinations by the boolean property popular and determine the averageVisitCost for each group to understand the cost difference between popular and non-popular destinations.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group all travel destinations by the boolean property popular and determine the averageVisitCost for each group to understand the cost difference between popular and non-popular destinations.", + "target_collection": "Travel_destinations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 252, + "database_schema_index": 3, + "natural_language_query": "Explore art pieces of significant historical relevance, filter those with a currentValuation greater than 1,000,000, calculate the average currentValuation, and group the results by their onDisplay status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Explore art pieces of significant historical relevance, filter those with a currentValuation greater than 1,000,000, calculate the average currentValuation, and group the results by their onDisplay status.", + "target_collection": "ArtPieces", + "search_query": "Explore art pieces of significant historical relevance", + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "onDisplay" + }, + "predicted_query": { + "corresponding_natural_language_query": "Explore art pieces of significant historical relevance, filter those with a currentValuation greater than 1,000,000, calculate the average currentValuation, and group the results by their onDisplay status.", + "target_collection": "ArtPieces", + "search_query": "significant historical relevance", + "limit": 5, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "onDisplay", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 253, + "database_schema_index": 3, + "natural_language_query": "Find the average currentValuation of art pieces with significant historical details in their artPieceHistory where the currentValuation is greater than 1,000,000.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find the average currentValuation of art pieces with significant historical details in their artPieceHistory where the currentValuation is greater than 1,000,000.", + "target_collection": "ArtPieces", + "search_query": "Explore notable art pieces with historical significance described in their artPieceHistory", + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the average currentValuation of art pieces with significant historical details in their artPieceHistory where the currentValuation is greater than 1,000,000.", + "target_collection": "Art pieces", + "search_query": "significant historical details in artPieceHistory", + "limit": 5, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 254, + "database_schema_index": 3, + "natural_language_query": "Explore exhibitions that feature modern art and innovative installations, focusing only on those with an averageVisitorCount above 100, grouped by the exhibitionTitle to identify how many unique exhibitions match this criterion.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Explore exhibitions that feature modern art and innovative installations, focusing only on those with an averageVisitorCount above 100, grouped by the exhibitionTitle to identify how many unique exhibitions match this criterion.", + "target_collection": "Exhibitions", + "search_query": "modern art and innovative installations", + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Explore exhibitions that feature modern art and innovative installations, focusing only on those with an averageVisitorCount above 100, grouped by the exhibitionTitle to identify how many unique exhibitions match this criterion.", + "target_collection": "Exhibitions", + "search_query": "modern art and innovative installations", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 255, + "database_schema_index": 3, + "natural_language_query": "Find exhibitions with descriptions about exploring the influence of Impressionism, where the averageVisitorCount is greater than 500, and count unique exhibition titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions with descriptions about exploring the influence of Impressionism, where the averageVisitorCount is greater than 500, and count unique exhibition titles.", + "target_collection": "Exhibitions", + "search_query": "exploring the influence of Impressionism", + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions with descriptions about exploring the influence of Impressionism, where the averageVisitorCount is greater than 500, and count unique exhibition titles.", + "target_collection": "Exhibitions", + "search_query": "exploring the influence of Impressionism", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "title", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "title", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 256, + "database_schema_index": 4, + "natural_language_query": "Find top museums highlighting Renaissance art, where entry fees are no more than 20, group results by exhibitHighlights, and determine how many are open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find top museums highlighting Renaissance art, where entry fees are no more than 20, group results by exhibitHighlights, and determine how many are open today.", + "target_collection": "Museums", + "search_query": "Top museums highlighting Renaissance art", + "integer_property_filter": { + "property_name": "entryFee", + "operator": "<=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitHighlights" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find top museums highlighting Renaissance art, where entry fees are no more than 20, group results by exhibitHighlights, and determine how many are open today.", + "target_collection": "Museums", + "search_query": "Renaissance art", + "limit": 5, + "integer_property_filter": { + "property_name": "entryFee", + "operator": "<=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitHighlights", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 257, + "database_schema_index": 4, + "natural_language_query": "List exhibitions with cultural themes in their exhibitionDescription that have an averageVisitorCount greater than 100, and summarize how many of these exhibitions are currentlyRunning.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "List exhibitions with cultural themes in their exhibitionDescription that have an averageVisitorCount greater than 100, and summarize how many of these exhibitions are currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": "cultural themes", + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "List exhibitions with cultural themes in their exhibitionDescription that have an averageVisitorCount greater than 100, and summarize how many of these exhibitions are currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": "cultural themes", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 258, + "database_schema_index": 4, + "natural_language_query": "Find museums where the exhibit highlights emphasize historical significance, filter for museums with entry fees exceeding 10, and group the results by each museum's name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where the exhibit highlights emphasize historical significance, filter for museums with entry fees exceeding 10, and group the results by each museum's name.", + "target_collection": "Museums", + "search_query": "exhibitHighlights", + "integer_property_filter": { + "property_name": "entryFee", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where the exhibit highlights emphasize historical significance, filter for museums with entry fees exceeding 10, and group the results by each museum's name.", + "target_collection": "Museums", + "search_query": "exhibit highlights emphasize historical significance", + "limit": 5, + "integer_property_filter": { + "property_name": "entryFees", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 259, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibitHighlights relevant to 'Impressionist art' that also have an entryFee greater than $10.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibitHighlights relevant to 'Impressionist art' that also have an entryFee greater than $10.", + "target_collection": "Museums", + "search_query": "Impressionist art", + "integer_property_filter": { + "property_name": "entryFee", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibitHighlights relevant to 'Impressionist art' that also have an entryFee greater than $10.", + "target_collection": "Museums", + "search_query": "exhibitHighlights relevant to 'Impressionist art'", + "limit": 5, + "integer_property_filter": { + "property_name": "entryFee", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 260, + "database_schema_index": 4, + "natural_language_query": "Search for art pieces with significant historical relevance using their artPieceHistory, filter for those that have 'Monet' in artPieceName, calculate the average of currentValuation, and group the results by their onDisplay status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Search for art pieces with significant historical relevance using their artPieceHistory, filter for those that have 'Monet' in artPieceName, calculate the average of currentValuation, and group the results by their onDisplay status.", + "target_collection": "ArtPieces", + "search_query": "Find artworks with significant historical relevance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceName", + "operator": "LIKE", + "value": "%Monet%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "onDisplay" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for art pieces with significant historical relevance using their artPieceHistory, filter for those that have 'Monet' in artPieceName, calculate the average of currentValuation, and group the results by their onDisplay status.", + "target_collection": "ArtPieces", + "search_query": "significant historical relevance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceName", + "operator": "LIKE", + "value": "Monet" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "onDisplay", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 261, + "database_schema_index": 4, + "natural_language_query": "Search for museums whose exhibitHighlights semantically match 'famous art exhibits with rich historical significance', where museumName is exactly 'Louvre', and compute the sum of entryFee.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Search for museums whose exhibitHighlights semantically match 'famous art exhibits with rich historical significance', where museumName is exactly 'Louvre', and compute the sum of entryFee.", + "target_collection": "Museums", + "search_query": "explore famous art exhibits with rich historical significance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "=", + "value": "Louvre" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for museums whose exhibitHighlights semantically match 'famous art exhibits with rich historical significance', where museumName is exactly 'Louvre', and compute the sum of entryFee.", + "target_collection": "Museums", + "search_query": "famous art exhibits with rich historical significance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "=", + "value": "Louvre" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 262, + "database_schema_index": 4, + "natural_language_query": "Retrieve museums with exhibit highlights similar to 'ancient artifacts', filter specifically on museums named 'Smithsonian', count the unique exhibit highlights available, and group the results by the museum name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Retrieve museums with exhibit highlights similar to 'ancient artifacts', filter specifically on museums named 'Smithsonian', count the unique exhibit highlights available, and group the results by the museum name.", + "target_collection": "Museums", + "search_query": "Find museums with exhibit highlights similar to 'ancient artifacts'.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "=", + "value": "Smithsonian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve museums with exhibit highlights similar to 'ancient artifacts', filter specifically on museums named 'Smithsonian', count the unique exhibit highlights available, and group the results by the museum name.", + "target_collection": "Museums", + "search_query": "ancient artifacts", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Smithsonian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 263, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions that focus on impressionist themes, check if they are currently running, and count the total number of distinct exhibition titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions that focus on impressionist themes, check if they are currently running, and count the total number of distinct exhibition titles.", + "target_collection": "Exhibitions", + "search_query": "Explore exhibitions that focus on impressionist themes in exhibitionDescription", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions that focus on impressionist themes, check if they are currently running, and count the total number of distinct exhibition titles.", + "target_collection": "Exhibitions", + "search_query": "impressionist themes", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "title", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 264, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibits highlighting the historical significance of Vincent van Gogh's pieces using semantic search, filter for museums whose names include 'National', aggregate by counting the number of museums open today, and group results by museumName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibits highlighting the historical significance of Vincent van Gogh's pieces using semantic search, filter for museums whose names include 'National', aggregate by counting the number of museums open today, and group results by museumName.", + "target_collection": "Museums", + "search_query": "historical significance of Vincent van Gogh's pieces", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "LIKE", + "value": "National" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibits highlighting the historical significance of Vincent van Gogh's pieces using semantic search, filter for museums whose names include 'National', aggregate by counting the number of museums open today, and group results by museumName.", + "target_collection": "Museums", + "search_query": "exhibits highlighting the historical significance of Vincent van Gogh's pieces", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "LIKE", + "value": "%National%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 265, + "database_schema_index": 4, + "natural_language_query": "Find museums that are most relevant to \"historical importance\" based on exhibitHighlights. Include only those museums where the museumName contains \"Art Gallery\", and show the percentage of these that are openToday.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that are most relevant to \"historical importance\" based on exhibitHighlights. Include only those museums where the museumName contains \"Art Gallery\", and show the percentage of these that are openToday.", + "target_collection": "Museums", + "search_query": "historical importance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "LIKE", + "value": "Art Gallery" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that are most relevant to \"historical importance\" based on exhibitHighlights. Include only those museums where the museumName contains \"Art Gallery\", and show the percentage of these that are openToday.", + "target_collection": "Museums", + "search_query": "historical importance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "LIKE", + "value": "%Art Gallery%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 266, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions that are about modern art with innovative displays by looking at the exhibition descriptions. Filter these exhibitions to include only those with 'Masterpiece' in their titles. Then, group the results based on whether the exhibitions are currently running or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions that are about modern art with innovative displays by looking at the exhibition descriptions. Filter these exhibitions to include only those with 'Masterpiece' in their titles. Then, group the results based on whether the exhibitions are currently running or not.", + "target_collection": "Exhibitions", + "search_query": "Discover exhibitions about modern art with a focus on innovative displays", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitionTitle", + "operator": "LIKE", + "value": "Masterpiece" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions that are about modern art with innovative displays by looking at the exhibition descriptions. Filter these exhibitions to include only those with 'Masterpiece' in their titles. Then, group the results based on whether the exhibitions are currently running or not.", + "target_collection": "Exhibitions", + "search_query": "modern art with innovative displays", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "title", + "operator": "LIKE", + "value": "%Masterpiece%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "running", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 267, + "database_schema_index": 4, + "natural_language_query": "Which museums, including those with names similar to 'Art Museum', have collections described as having significant cultural impact?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Which museums, including those with names similar to 'Art Museum', have collections described as having significant cultural impact?", + "target_collection": "Museums", + "search_query": "The cultural significance of the museum's collection and unique exhibits that attract thousands of visitors.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "LIKE", + "value": "*Art Museum*" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Which museums, including those with names similar to 'Art Museum', have collections described as having significant cultural impact?", + "target_collection": "Museums", + "search_query": "collections with significant cultural impact", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "%Art Museum%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 268, + "database_schema_index": 4, + "natural_language_query": "What are the museums, grouped by their names, that have exhibit highlights including renaissance art and are open today, along with the sum of their entry fees?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What are the museums, grouped by their names, that have exhibit highlights including renaissance art and are open today, along with the sum of their entry fees?", + "target_collection": "Museums", + "search_query": "exhibitHighlights including 'renaissance art'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the museums, grouped by their names, that have exhibit highlights including renaissance art and are open today, along with the sum of their entry fees?", + "target_collection": "Museums", + "search_query": "exhibit highlights including renaissance art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 269, + "database_schema_index": 4, + "natural_language_query": "Find currently running exhibitions that explore the theme of Renaissance art and calculate the average visitor count.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find currently running exhibitions that explore the theme of Renaissance art and calculate the average visitor count.", + "target_collection": "Exhibitions", + "search_query": "Explore the theme of Renaissance art.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find currently running exhibitions that explore the theme of Renaissance art and calculate the average visitor count.", + "target_collection": "Exhibitions", + "search_query": "theme of Renaissance art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "visitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9, + "error": null + }, + { + "query_index": 270, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions with thematic content related to 'contemporary art' that are currently running, categorize them by exhibitionTitle, and count the number of occurrences of each exhibitionTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions with thematic content related to 'contemporary art' that are currently running, categorize them by exhibitionTitle, and count the number of occurrences of each exhibitionTitle.", + "target_collection": "Exhibitions", + "search_query": "contemporary art", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions with thematic content related to 'contemporary art' that are currently running, categorize them by exhibitionTitle, and count the number of occurrences of each exhibitionTitle.", + "target_collection": "Exhibitions", + "search_query": "contemporary art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "running", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitionTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 271, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibits that have historical significance and are open today, and count the number of unique museum names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibits that have historical significance and are open today, and count the number of unique museum names.", + "target_collection": "Museums", + "search_query": "Search for museums that have exhibits with historical significance in their exhibitHighlights", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibits that have historical significance and are open today, and count the number of unique museum names.", + "target_collection": "Museums", + "search_query": "exhibits with historical significance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 272, + "database_schema_index": 4, + "natural_language_query": "Explore museums with notable exhibit highlights that include ancient history artifacts, find which ones are open today, count the total number of museums open today, and segment the results by the museum name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Explore museums with notable exhibit highlights that include ancient history artifacts, find which ones are open today, count the total number of museums open today, and segment the results by the museum name.", + "target_collection": "Museums", + "search_query": "Explore museums with notable exhibitHighlights that include ancient history artifacts", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Explore museums with notable exhibit highlights that include ancient history artifacts, find which ones are open today, count the total number of museums open today, and segment the results by the museum name.", + "target_collection": "Museums", + "search_query": "notable exhibit highlights that include ancient history artifacts", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 273, + "database_schema_index": 4, + "natural_language_query": "Find museums that have notable exhibits with historical significance, indicate if they are open today, and provide the percentage of museums that are indeed open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that have notable exhibits with historical significance, indicate if they are open today, and provide the percentage of museums that are indeed open today.", + "target_collection": "Museums", + "search_query": "exhibitHighlights", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that have notable exhibits with historical significance, indicate if they are open today, and provide the percentage of museums that are indeed open today.", + "target_collection": "Museums", + "search_query": "notable exhibits with historical significance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 274, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibits related to the Renaissance that are open today, and group the results by the museum's name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibits related to the Renaissance that are open today, and group the results by the museum's name.", + "target_collection": "Museums", + "search_query": "Renaissance exhibits", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibits related to the Renaissance that are open today, and group the results by the museum's name.", + "target_collection": "Museums", + "search_query": "exhibits related to the Renaissance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 275, + "database_schema_index": 4, + "natural_language_query": "Find museums that highlight Renaissance art exhibits using semantic search on the exhibitHighlights property and filter to only those where openToday is true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that highlight Renaissance art exhibits using semantic search on the exhibitHighlights property and filter to only those where openToday is true.", + "target_collection": "Museums", + "search_query": "Find museums that highlight Renaissance art exhibits", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that highlight Renaissance art exhibits using semantic search on the exhibitHighlights property and filter to only those where openToday is true.", + "target_collection": "Museums", + "search_query": "Renaissance art exhibits", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 276, + "database_schema_index": 4, + "natural_language_query": "Find museums that have Impressionist art mentioned in their exhibitHighlights, calculate the average entryFee, and group results based on whether they are openToday.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that have Impressionist art mentioned in their exhibitHighlights, calculate the average entryFee, and group results based on whether they are openToday.", + "target_collection": "Museums", + "search_query": "Explore museums showcasing Impressionist art in their exhibitHighlights.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that have Impressionist art mentioned in their exhibitHighlights, calculate the average entryFee, and group results based on whether they are openToday.", + "target_collection": "Museums", + "search_query": "Impressionist art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 277, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions focused on impressionism and calculate the total average visitor count using the averageVisitorCount property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions focused on impressionism and calculate the total average visitor count using the averageVisitorCount property.", + "target_collection": "Exhibitions", + "search_query": "Explore exhibitions focusing on impressionism.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions focused on impressionism and calculate the total average visitor count using the averageVisitorCount property.", + "target_collection": "Exhibitions", + "search_query": "impressionism", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 278, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibits about Renaissance art, categorize the results by their entryFee, and show the 5 most common exhibitHighlights.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibits about Renaissance art, categorize the results by their entryFee, and show the 5 most common exhibitHighlights.", + "target_collection": "Museums", + "search_query": "Search for museums that have exhibits about Renaissance art.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "entryFee" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibits about Renaissance art, categorize the results by their entryFee, and show the 5 most common exhibitHighlights.", + "target_collection": "Museums", + "search_query": "exhibits about Renaissance art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "entryFee", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 279, + "database_schema_index": 4, + "natural_language_query": "Which museums have the most notable exhibit highlights according to their exhibitHighlights description, and how many distinct museum names are there?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Which museums have the most notable exhibit highlights according to their exhibitHighlights description, and how many distinct museum names are there?", + "target_collection": "Museums", + "search_query": "Find museums with notable exhibits mentioned in exhibitHighlights", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Which museums have the most notable exhibit highlights according to their exhibitHighlights description, and how many distinct museum names are there?", + "target_collection": "Museums", + "search_query": "notable exhibit highlights", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 280, + "database_schema_index": 4, + "natural_language_query": "Identify exhibitions focusing on historical themes, group them by their current status of being open to the public, and compute the percentage of exhibitions that are currently running.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Identify exhibitions focusing on historical themes, group them by their current status of being open to the public, and compute the percentage of exhibitions that are currently running.", + "target_collection": "Exhibitions", + "search_query": "Explore exhibitions with themes of historical significance in their exhibitionDescription.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "currentlyRunning" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify exhibitions focusing on historical themes, group them by their current status of being open to the public, and compute the percentage of exhibitions that are currently running.", + "target_collection": "Exhibitions", + "search_query": "historical themes", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToPublic", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "openToPublic", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 281, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibitions related to the Renaissance period and count how many of these museums are open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibitions related to the Renaissance period and count how many of these museums are open today.", + "target_collection": "Museums", + "search_query": "Discover museums with exhibitions related to the Renaissance period in their exhibitHighlights property.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibitions related to the Renaissance period and count how many of these museums are open today.", + "target_collection": "Museums", + "search_query": "exhibitions related to the Renaissance period", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 282, + "database_schema_index": 4, + "natural_language_query": "Find museums where the exhibitHighlights mention ancient artifacts and group the results by whether they are openToday.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where the exhibitHighlights mention ancient artifacts and group the results by whether they are openToday.", + "target_collection": "Museums", + "search_query": "Find museums where exhibitHighlights mention ancient artifacts", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where the exhibitHighlights mention ancient artifacts and group the results by whether they are openToday.", + "target_collection": "Museums", + "search_query": "ancient artifacts", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 283, + "database_schema_index": 4, + "natural_language_query": "What are the museums with exhibit highlights focusing on ancient civilizations?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What are the museums with exhibit highlights focusing on ancient civilizations?", + "target_collection": "Museums", + "search_query": "Find museums with exhibit highlights related to ancient civilizations", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the museums with exhibit highlights focusing on ancient civilizations?", + "target_collection": "Museums", + "search_query": "exhibit highlights focusing on ancient civilizations", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 284, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions where the averageVisitorCount is at least 100, group them by exhibitionTitle, and compute the mean averageVisitorCount for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is at least 100, group them by exhibitionTitle, and compute the mean averageVisitorCount for each group.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">=", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is at least 100, group them by exhibitionTitle, and compute the mean averageVisitorCount for each group.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">=", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 285, + "database_schema_index": 4, + "natural_language_query": "Find all exhibitions where the averageVisitorCount is greater than 500, and calculate the total sum of averageVisitorCount for these exhibitions.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find all exhibitions where the averageVisitorCount is greater than 500, and calculate the total sum of averageVisitorCount for these exhibitions.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all exhibitions where the averageVisitorCount is greater than 500, and calculate the total sum of averageVisitorCount for these exhibitions.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 286, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 200, count the number of different exhibition titles, and group the results by whether the exhibition is currentlyRunning.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 200, count the number of different exhibition titles, and group the results by whether the exhibition is currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 200 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 200, count the number of different exhibition titles, and group the results by whether the exhibition is currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 200 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "title", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 287, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 1000 and count how many unique exhibitionDescription texts there are.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 1000 and count how many unique exhibitionDescription texts there are.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 1000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 1000 and count how many unique exhibitionDescription texts there are.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 1000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitionDescription", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 288, + "database_schema_index": 4, + "natural_language_query": "Find museums where the entryFee is 15 or less, aggregate the percentage of museums that are openToday, and group the results by museumName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where the entryFee is 15 or less, aggregate the percentage of museums that are openToday, and group the results by museumName.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": { + "property_name": "entryFee", + "operator": "<=", + "value": 15 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where the entryFee is 15 or less, aggregate the percentage of museums that are openToday, and group the results by museumName.", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "entryFee", + "operator": "<=", + "value": 15 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 289, + "database_schema_index": 4, + "natural_language_query": "Find art pieces from ArtPieces with a currentValuation of at least 1,000,000 and count how many of these are onDisplay.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find art pieces from ArtPieces with a currentValuation of at least 1,000,000 and count how many of these are onDisplay.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">=", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find art pieces from ArtPieces with a currentValuation of at least 1,000,000 and count how many of these are onDisplay.", + "target_collection": "ArtPieces", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">=", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "onDisplay", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 290, + "database_schema_index": 4, + "natural_language_query": "Show exhibitions where the averageVisitorCount is greater than or equal to 100, and group the results by the currentlyRunning status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Show exhibitions where the averageVisitorCount is greater than or equal to 100, and group the results by the currentlyRunning status.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">=", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show exhibitions where the averageVisitorCount is greater than or equal to 100, and group the results by the currentlyRunning status.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">=", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 291, + "database_schema_index": 4, + "natural_language_query": "Find art pieces with a currentValuation greater than 1,000,000.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find art pieces with a currentValuation greater than 1,000,000.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find art pieces with a currentValuation greater than 1,000,000.", + "target_collection": "ArtPieces", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 292, + "database_schema_index": 4, + "natural_language_query": "For museums that are currently open, calculate the average entry fee grouped by the name of the museum.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "For museums that are currently open, calculate the average entry fee grouped by the name of the museum.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "For museums that are currently open, calculate the average entry fee grouped by the name of the museum.", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 293, + "database_schema_index": 4, + "natural_language_query": "Find the average currentValuation of all art pieces in the ArtPieces collection whose artPieceHistory contains the word 'Renaissance'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find the average currentValuation of all art pieces in the ArtPieces collection whose artPieceHistory contains the word 'Renaissance'.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceHistory", + "operator": "LIKE", + "value": "Renaissance" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the average currentValuation of all art pieces in the ArtPieces collection whose artPieceHistory contains the word 'Renaissance'.", + "target_collection": "ArtPieces", + "search_query": "Renaissance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 294, + "database_schema_index": 4, + "natural_language_query": "Count the number of unique museums with exhibitHighlights containing 'historical significance' and group these counts by whether or not the museum is open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Count the number of unique museums with exhibitHighlights containing 'historical significance' and group these counts by whether or not the museum is open today.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitHighlights", + "operator": "LIKE", + "value": "historical significance" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday" + }, + "predicted_query": { + "corresponding_natural_language_query": "Count the number of unique museums with exhibitHighlights containing 'historical significance' and group these counts by whether or not the museum is open today.", + "target_collection": "Museums", + "search_query": "historical significance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 295, + "database_schema_index": 4, + "natural_language_query": "Find art pieces where \"Monet\" is mentioned in artPieceHistory, and count the number of unique artPieceName values.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find art pieces where \"Monet\" is mentioned in artPieceHistory, and count the number of unique artPieceName values.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceHistory", + "operator": "LIKE", + "value": "Monet" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find art pieces where \"Monet\" is mentioned in artPieceHistory, and count the number of unique artPieceName values.", + "target_collection": "ArtPieces", + "search_query": "Monet", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "artPieceName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 296, + "database_schema_index": 4, + "natural_language_query": "Find museums where exhibitHighlights contain the keyword 'ancient artifacts', calculate what percentage of these museums are openToday, and group the museums by entryFee to see the distribution across different price categories.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where exhibitHighlights contain the keyword 'ancient artifacts', calculate what percentage of these museums are openToday, and group the museums by entryFee to see the distribution across different price categories.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitHighlights", + "operator": "LIKE", + "value": "ancient artifacts" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "entryFee" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where exhibitHighlights contain the keyword 'ancient artifacts', calculate what percentage of these museums are openToday, and group the museums by entryFee to see the distribution across different price categories.", + "target_collection": "Museums", + "search_query": "ancient artifacts", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "entryFee", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 297, + "database_schema_index": 4, + "natural_language_query": "Find museums that mention 'renaissance' in their exhibitHighlights and count how many of them are open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that mention 'renaissance' in their exhibitHighlights and count how many of them are open today.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitHighlights", + "operator": "LIKE", + "value": "renaissance" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that mention 'renaissance' in their exhibitHighlights and count how many of them are open today.", + "target_collection": "Museums", + "search_query": "renaissance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 298, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions where the exhibitionTitle contains 'Impressionism' and group the results by currentlyRunning status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions where the exhibitionTitle contains 'Impressionism' and group the results by currentlyRunning status.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitionTitle", + "operator": "LIKE", + "value": "Impressionism" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions where the exhibitionTitle contains 'Impressionism' and group the results by currentlyRunning status.", + "target_collection": "Exhibitions", + "search_query": "exhibitionTitle:Impressionism", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 299, + "database_schema_index": 4, + "natural_language_query": "Find art pieces where the artPieceName contains the word 'Starry'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find art pieces where the artPieceName contains the word 'Starry'.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceName", + "operator": "LIKE", + "value": "%Starry%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find art pieces where the artPieceName contains the word 'Starry'.", + "target_collection": "ArtPieces", + "search_query": "Starry", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 300, + "database_schema_index": 4, + "natural_language_query": "Find a summary of the total averageVisitorCount for each exhibitionTitle where the exhibition is currentlyRunning.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find a summary of the total averageVisitorCount for each exhibitionTitle where the exhibition is currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find a summary of the total averageVisitorCount for each exhibitionTitle where the exhibition is currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 301, + "database_schema_index": 4, + "natural_language_query": "Find all art pieces that are on display and calculate the total current valuation of these pieces using the `onDisplay` property for filtering and `currentValuation` property for aggregation.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find all art pieces that are on display and calculate the total current valuation of these pieces using the `onDisplay` property for filtering and `currentValuation` property for aggregation.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "onDisplay", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all art pieces that are on display and calculate the total current valuation of these pieces using the `onDisplay` property for filtering and `currentValuation` property for aggregation.", + "target_collection": "ArtPieces", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "onDisplay", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 302, + "database_schema_index": 4, + "natural_language_query": "Retrieve a list of all museums that are open today, group them by the museumName, and within each group, count the occurrence of each unique exhibitHighlights.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Retrieve a list of all museums that are open today, group them by the museumName, and within each group, count the occurrence of each unique exhibitHighlights.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve a list of all museums that are open today, group them by the museumName, and within each group, count the occurrence of each unique exhibitHighlights.", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 303, + "database_schema_index": 4, + "natural_language_query": "Find museums in the Museums collection that are open today (using the 'openToday' boolean property filter), and determine the most common exhibit highlights among them (using text property aggregation on 'exhibitHighlights').", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums in the Museums collection that are open today (using the 'openToday' boolean property filter), and determine the most common exhibit highlights among them (using text property aggregation on 'exhibitHighlights').", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums in the Museums collection that are open today (using the 'openToday' boolean property filter), and determine the most common exhibit highlights among them (using text property aggregation on 'exhibitHighlights').", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 304, + "database_schema_index": 4, + "natural_language_query": "Show the percentage of exhibitions on 'exhibitionTitle' that are currently running. Group the results by exhibitionTitle to determine which specific exhibitions have the highest visitor count while currentlyRunning.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Show the percentage of exhibitions on 'exhibitionTitle' that are currently running. Group the results by exhibitionTitle to determine which specific exhibitions have the highest visitor count while currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show the percentage of exhibitions on 'exhibitionTitle' that are currently running. Group the results by exhibitionTitle to determine which specific exhibitions have the highest visitor count while currentlyRunning.", + "target_collection": "ExhibitionTitle", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 305, + "database_schema_index": 4, + "natural_language_query": "Count how many exhibitions are currently open to the public and find those that are open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Count how many exhibitions are currently open to the public and find those that are open.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Count how many exhibitions are currently open to the public and find those that are open.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isOpenToPublic", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isOpenToPublic", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 306, + "database_schema_index": 4, + "natural_language_query": "List all museums that are open today and group them by their entry fee.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "List all museums that are open today and group them by their entry fee.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "entryFee" + }, + "predicted_query": { + "corresponding_natural_language_query": "List all museums that are open today and group them by their entry fee.", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "entryFee", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 307, + "database_schema_index": 4, + "natural_language_query": "Find museums where the openToday flag is set to true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where the openToday flag is set to true.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where the openToday flag is set to true.", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 308, + "database_schema_index": 4, + "natural_language_query": "For each unique exhibitionTitle, determine the count of exhibitions that are currently running by aggregating over the currentlyRunning property and grouping the results by exhibitionTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "For each unique exhibitionTitle, determine the count of exhibitions that are currently running by aggregating over the currentlyRunning property and grouping the results by exhibitionTitle.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "For each unique exhibitionTitle, determine the count of exhibitions that are currently running by aggregating over the currentlyRunning property and grouping the results by exhibitionTitle.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 309, + "database_schema_index": 4, + "natural_language_query": "What is the mean of the averageVisitorCount in the Exhibitions collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What is the mean of the averageVisitorCount in the Exhibitions collection?", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the mean of the averageVisitorCount in the Exhibitions collection?", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 310, + "database_schema_index": 4, + "natural_language_query": "What are the top 5 most common exhibit highlights in terms of descriptions for museums, grouped by each museum's name?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What are the top 5 most common exhibit highlights in terms of descriptions for museums, grouped by each museum's name?", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the top 5 most common exhibit highlights in terms of descriptions for museums, grouped by each museum's name?", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "descriptions", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 311, + "database_schema_index": 4, + "natural_language_query": "What is the count of unique museum names in the Museums collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What is the count of unique museum names in the Museums collection?", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the count of unique museum names in the Museums collection?", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 312, + "database_schema_index": 4, + "natural_language_query": "Find out how many museums are open today and group this information by museumName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find out how many museums are open today and group this information by museumName.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find out how many museums are open today and group this information by museumName.", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 313, + "database_schema_index": 4, + "natural_language_query": "Calculate the percentage of museums that are open today based on the openToday property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of museums that are open today based on the openToday property.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of museums that are open today based on the openToday property.", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 314, + "database_schema_index": 4, + "natural_language_query": "Organize museums based on whether they are open today and calculate the average entry fee for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Organize museums based on whether they are open today and calculate the average entry fee for each group.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday" + }, + "predicted_query": { + "corresponding_natural_language_query": "Organize museums based on whether they are open today and calculate the average entry fee for each group.", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + } + ] +} \ No newline at end of file diff --git a/src/test_gorilla/gpt-4o-mini-02-21-25.json b/src/test_gorilla/gpt-4o-mini-02-21-25.json new file mode 100644 index 0000000..2ef9dc8 --- /dev/null +++ b/src/test_gorilla/gpt-4o-mini-02-21-25.json @@ -0,0 +1,46310 @@ +{ + "timestamp": "2025-02-21T11:47:02.260025", + "model_name": "gpt-4o-mini", + "generate_with_models": false, + "total_queries": 315, + "successful_predictions": 260, + "failed_predictions": 55, + "average_ast_score": 0.8680769230769215, + "perfect_matches": 122, + "per_schema_scores": { + "0": 0.7078125000000003, + "1": 0.7468750000000005, + "2": 0.7550781250000003, + "3": 0.6753906250000002 + }, + "detailed_results": [ + { + "query_index": 0, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine, where the average rating is at least 4, count how many such restaurants there are, and group them by whether they are currently open or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine, where the average rating is at least 4, count how many such restaurants there are, and group them by whether they are currently open or not.", + "target_collection": "Restaurants", + "search_query": "Find restaurants with a cozy ambiance and Italian cuisine", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine, where the average rating is at least 4, count how many such restaurants there are, and group them by whether they are currently open or not.", + "target_collection": "Restaurants", + "search_query": "cozy ambiance Italian cuisine", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 1, + "database_schema_index": 0, + "natural_language_query": "Find Italian cuisine restaurants with a cozy ambiance that have an average rating of at least 4, plus provide the count of such restaurants that are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find Italian cuisine restaurants with a cozy ambiance that have an average rating of at least 4, plus provide the count of such restaurants that are currently open.", + "target_collection": "Restaurants", + "search_query": "Find restaurants with cozy ambiance and Italian cuisine", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find Italian cuisine restaurants with a cozy ambiance that have an average rating of at least 4, plus provide the count of such restaurants that are currently open.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine restaurants with a cozy ambiance", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 2, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that match the description 'authentic Italian ambiance', have an averageRating greater than 4, list the top 5 most common restaurant names in this set, and partition the results based on whether the restaurant is currently open or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that match the description 'authentic Italian ambiance', have an averageRating greater than 4, list the top 5 most common restaurant names in this set, and partition the results based on whether the restaurant is currently open or not.", + "target_collection": "Restaurants", + "search_query": "authentic Italian ambiance", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that match the description 'authentic Italian ambiance', have an averageRating greater than 4, list the top 5 most common restaurant names in this set, and partition the results based on whether the restaurant is currently open or not.", + "target_collection": "Restaurants", + "search_query": "authentic Italian ambiance", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 3, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a family-friendly ambiance and Italian cuisine rated with at least 4.5 in averageRating, and identify the top 3 most common descriptions.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a family-friendly ambiance and Italian cuisine rated with at least 4.5 in averageRating, and identify the top 3 most common descriptions.", + "target_collection": "Restaurants", + "search_query": "Find restaurants with a family-friendly ambiance and Italian cuisine", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with a family-friendly ambiance and Italian cuisine rated with at least 4.5 in averageRating, and identify the top 3 most common descriptions.", + "target_collection": "Restaurants", + "search_query": "family-friendly ambiance Italian cuisine", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 4, + "database_schema_index": 0, + "natural_language_query": "Find restaurants offering Italian cuisine with a cozy atmosphere, with at least an average rating of 4.5. Also, calculate the percentage of these restaurants that are open and group results based on their open status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants offering Italian cuisine with a cozy atmosphere, with at least an average rating of 4.5. Also, calculate the percentage of these restaurants that are open and group results based on their open status.", + "target_collection": "Restaurants", + "search_query": "Find restaurants offering Italian cuisine with a cozy atmosphere", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants offering Italian cuisine with a cozy atmosphere, with at least an average rating of 4.5. Also, calculate the percentage of these restaurants that are open and group results based on their open status.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine with a cozy atmosphere", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 5, + "database_schema_index": 0, + "natural_language_query": "Find Italian cuisine restaurants with descriptions containing 'Italian cuisine', with averageRating greater than 4.0, and calculate the percentage of these that are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find Italian cuisine restaurants with descriptions containing 'Italian cuisine', with averageRating greater than 4.0, and calculate the percentage of these that are currently open.", + "target_collection": "Restaurants", + "search_query": "Search for restaurants with descriptions containing 'Italian cuisine'", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find Italian cuisine restaurants with descriptions containing 'Italian cuisine', with averageRating greater than 4.0, and calculate the percentage of these that are currently open.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 6, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that are similar to Italian family-friendly places, have an averageRating of at least 4, and group them by whether they are currently open (openNow).", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that are similar to Italian family-friendly places, have an averageRating of at least 4, and group them by whether they are currently open (openNow).", + "target_collection": "Restaurants", + "search_query": "Italian, family-friendly ambiance", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that are similar to Italian family-friendly places, have an averageRating of at least 4, and group them by whether they are currently open (openNow).", + "target_collection": "Restaurants", + "search_query": "Italian family-friendly places", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 7, + "database_schema_index": 0, + "natural_language_query": "Find Italian restaurants with a cozy ambiance, and the averageRating must be greater than 4.0.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find Italian restaurants with a cozy ambiance, and the averageRating must be greater than 4.0.", + "target_collection": "Restaurants", + "search_query": "Looking for Italian restaurants with a cozy ambiance", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find Italian restaurants with a cozy ambiance, and the averageRating must be greater than 4.0.", + "target_collection": "Restaurants", + "search_query": "Italian restaurants with a cozy ambiance", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 8, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with an Italian ambiance and explicitly mentioned as family friendly in their description, calculate the average of each restaurant's averageRating, and group the results by restaurant name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with an Italian ambiance and explicitly mentioned as family friendly in their description, calculate the average of each restaurant's averageRating, and group the results by restaurant name.", + "target_collection": "Restaurants", + "search_query": "Italian ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "family friendly" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with an Italian ambiance and explicitly mentioned as family friendly in their description, calculate the average of each restaurant's averageRating, and group the results by restaurant name.", + "target_collection": "Restaurants", + "search_query": "Italian ambiance family friendly", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 9, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that have a romantic ambiance using search query, filter the results to include only those where the name contains 'Ristorante', and count the number of these restaurants using the averageRating property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that have a romantic ambiance using search query, filter the results to include only those where the name contains 'Ristorante', and count the number of these restaurants using the averageRating property.", + "target_collection": "Restaurants", + "search_query": "romantic ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "Ristorante" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that have a romantic ambiance using search query, filter the results to include only those where the name contains 'Ristorante', and count the number of these restaurants using the averageRating property.", + "target_collection": "Restaurants", + "search_query": "romantic ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "Ristorante" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 10, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a cozy and modern ambiance that mention 'casual dining' in their description. Count the number of unique restaurant names and group the results by whether they are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a cozy and modern ambiance that mention 'casual dining' in their description. Count the number of unique restaurant names and group the results by whether they are currently open.", + "target_collection": "Restaurants", + "search_query": "Cozy and modern ambiance with festive atmosphere", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%casual dining%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 11, + "database_schema_index": 0, + "natural_language_query": "Search for restaurants similar in description and ambiance to those fitting the concept of cozy and modern cuisine, filter to only include restaurants named exactly 'Ocean View Grille', and count the occurrences of each restaurant name in the results.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Search for restaurants similar in description and ambiance to those fitting the concept of cozy and modern cuisine, filter to only include restaurants named exactly 'Ocean View Grille', and count the occurrences of each restaurant name in the results.", + "target_collection": "Restaurants", + "search_query": "Find the most relevant restaurants based on their description of the cuisine and ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Ocean View Grille" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 12, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a nature ambiance, having Italian cuisine in their description, calculate the percentage of restaurants currently open, and group them by their average rating to summarize.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a nature ambiance, having Italian cuisine in their description, calculate the percentage of restaurants currently open, and group them by their average rating to summarize.", + "target_collection": "Restaurants", + "search_query": "nature ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with a nature ambiance, having Italian cuisine in their description, calculate the percentage of restaurants currently open, and group them by their average rating to summarize.", + "target_collection": "Restaurants", + "search_query": "nature ambiance Italian cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 13, + "database_schema_index": 0, + "natural_language_query": "Find restaurants similar to a cozy Italian restaurant with a great wine selection, include only those whose name contains 'Grill', and count how many of them are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants similar to a cozy Italian restaurant with a great wine selection, include only those whose name contains 'Grill', and count how many of them are currently open.", + "target_collection": "Restaurants", + "search_query": "A cozy Italian restaurant with a great wine selection", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "Grill" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants similar to a cozy Italian restaurant with a great wine selection, include only those whose name contains 'Grill', and count how many of them are currently open.", + "target_collection": "Restaurants", + "search_query": "cozy Italian restaurant with a great wine selection", + "limit": 5, + "integer_property_filter": { + "property_name": "totalCount", + "operator": ">", + "value": 0 + }, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "%Grill%" + }, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 14, + "database_schema_index": 0, + "natural_language_query": "Find restaurants offering authentic Italian cuisine while they are open now, and group these restaurants by their average rating.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants offering authentic Italian cuisine while they are open now, and group these restaurants by their average rating.", + "target_collection": "Restaurants", + "search_query": "authentic Italian cuisine", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants offering authentic Italian cuisine while they are open now, and group these restaurants by their average rating.", + "target_collection": "Restaurants", + "search_query": "authentic Italian cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 15, + "database_schema_index": 0, + "natural_language_query": "Search for restaurants that are famous for Italian cuisine using semantic search for 'cuisine' and 'ambiance', and additionally filter to show only those whose description explicitly contains the word 'romantic'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Search for restaurants that are famous for Italian cuisine using semantic search for 'cuisine' and 'ambiance', and additionally filter to show only those whose description explicitly contains the word 'romantic'.", + "target_collection": "Restaurants", + "search_query": "Find restaurants known for Italian cuisine with a romantic ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "romantic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for restaurants that are famous for Italian cuisine using semantic search for 'cuisine' and 'ambiance', and additionally filter to show only those whose description explicitly contains the word 'romantic'.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "romantic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description.cuisine", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "description.cuisine", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 16, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that offer a romantic ambiance and Italian cuisine, ensure they are open now, calculate the average rating, and organize the results by each restaurant's name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that offer a romantic ambiance and Italian cuisine, ensure they are open now, calculate the average rating, and organize the results by each restaurant's name.", + "target_collection": "Restaurants", + "search_query": "Find restaurants that offer a romantic ambiance and Italian cuisine", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that offer a romantic ambiance and Italian cuisine, ensure they are open now, calculate the average rating, and organize the results by each restaurant's name.", + "target_collection": "Restaurants", + "search_query": "romantic ambiance Italian cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 17, + "database_schema_index": 0, + "natural_language_query": "Find cozy Italian restaurants with a great wine selection that are open now, and calculate the average rating of these open restaurants.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find cozy Italian restaurants with a great wine selection that are open now, and calculate the average rating of these open restaurants.", + "target_collection": "Restaurants", + "search_query": "Looking for cozy Italian restaurants with a great wine selection", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find cozy Italian restaurants with a great wine selection that are open now, and calculate the average rating of these open restaurants.", + "target_collection": "Restaurants", + "search_query": "cozy Italian restaurants with a great wine selection", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 18, + "database_schema_index": 0, + "natural_language_query": "What are the romantic Italian restaurants that are currently open now, and what is the most common description among them, grouped by their name?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What are the romantic Italian restaurants that are currently open now, and what is the most common description among them, grouped by their name?", + "target_collection": "Restaurants", + "search_query": "Find restaurants matching 'romantic Italian dining'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the romantic Italian restaurants that are currently open now, and what is the most common description among them, grouped by their name?", + "target_collection": "Restaurants", + "search_query": "romantic Italian restaurants", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 19, + "database_schema_index": 0, + "natural_language_query": "Find restaurants offering Mediterranean cuisine with a cozy ambiance and are currently open, then list the top 5 most common restaurant names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants offering Mediterranean cuisine with a cozy ambiance and are currently open, then list the top 5 most common restaurant names.", + "target_collection": "Restaurants", + "search_query": "Explore Mediterranean cuisine with a cozy ambiance", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants offering Mediterranean cuisine with a cozy ambiance and are currently open, then list the top 5 most common restaurant names.", + "target_collection": "Restaurants", + "search_query": "Mediterranean cuisine cozy ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 20, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that are known for their cozy ambiance and Italian cuisine, filter those that are currently open, aggregate to count how many are open versus closed, and organize results by the name of the restaurant.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that are known for their cozy ambiance and Italian cuisine, filter those that are currently open, aggregate to count how many are open versus closed, and organize results by the name of the restaurant.", + "target_collection": "Restaurants", + "search_query": "Find restaurants that are known for their cozy ambiance and Italian cuisine.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that are known for their cozy ambiance and Italian cuisine, filter those that are currently open, aggregate to count how many are open versus closed, and organize results by the name of the restaurant.", + "target_collection": "Restaurants", + "search_query": "cozy ambiance Italian cuisine", + "limit": 5, + "integer_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": 1 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 21, + "database_schema_index": 0, + "natural_language_query": "Find restaurants serving Italian cuisine with a romantic ambiance that are currently open, and calculate the percentage of restaurants that are open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants serving Italian cuisine with a romantic ambiance that are currently open, and calculate the percentage of restaurants that are open.", + "target_collection": "Restaurants", + "search_query": "Find restaurants serving Italian cuisine with a romantic ambiance", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants serving Italian cuisine with a romantic ambiance that are currently open, and calculate the percentage of restaurants that are open.", + "target_collection": "Restaurants", + "search_query": "romantic ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description.cuisine", + "operator": "=", + "value": "Italian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 22, + "database_schema_index": 0, + "natural_language_query": "Find cozy Italian restaurants that are currently open, and group them by their name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find cozy Italian restaurants that are currently open, and group them by their name.", + "target_collection": "Restaurants", + "search_query": "Find cozy Italian restaurants", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find cozy Italian restaurants that are currently open, and group them by their name.", + "target_collection": "Restaurants", + "search_query": "cozy Italian restaurants", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 23, + "database_schema_index": 0, + "natural_language_query": "Find currently open restaurants that conceptually relate to 'Italian cuisine with a cozy ambiance.'", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find currently open restaurants that conceptually relate to 'Italian cuisine with a cozy ambiance.'", + "target_collection": "Restaurants", + "search_query": "Find restaurants serving Italian cuisine with a cozy ambiance", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find currently open restaurants that conceptually relate to 'Italian cuisine with a cozy ambiance.'", + "target_collection": "Restaurants", + "search_query": "Italian cuisine with a cozy ambiance", + "limit": 5, + "integer_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": 1 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "description.cuisine", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 24, + "database_schema_index": 0, + "natural_language_query": "What are the total party sizes of reservations that mention 'birthday' in notes, grouped by whether the reservation is confirmed?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What are the total party sizes of reservations that mention 'birthday' in notes, grouped by whether the reservation is confirmed?", + "target_collection": "Reservations", + "search_query": "Find reservations where the notes mention 'birthday'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "confirmed" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the total party sizes of reservations that mention 'birthday' in notes, grouped by whether the reservation is confirmed?", + "target_collection": "Reservations", + "search_query": "birthday", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "confirmed", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "confirmed", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 25, + "database_schema_index": 0, + "natural_language_query": "What is the average price of spicy vegetarian menu items?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What is the average price of spicy vegetarian menu items?", + "target_collection": "Menus", + "search_query": "Find menu items with a description that matches 'spicy vegetarian options'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "price", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average price of spicy vegetarian menu items?", + "target_collection": "MenuItems", + "search_query": "spicy vegetarian", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "price", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 26, + "database_schema_index": 0, + "natural_language_query": "Identify romantic restaurants by analyzing descriptions for ambiance, count the number of unique restaurants, and group the results by whether they are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Identify romantic restaurants by analyzing descriptions for ambiance, count the number of unique restaurants, and group the results by whether they are currently open.", + "target_collection": "Restaurants", + "search_query": "Find restaurants that offer a romantic ambiance.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 27, + "database_schema_index": 0, + "natural_language_query": "Identify how many unique restaurants offer a cozy Italian cuisine with a romantic ambiance by analyzing their descriptions and count the occurrences of different restaurant names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Identify how many unique restaurants offer a cozy Italian cuisine with a romantic ambiance by analyzing their descriptions and count the occurrences of different restaurant names.", + "target_collection": "Restaurants", + "search_query": "Find restaurants with a description that matches 'cozy Italian cuisine with romantic ambiance'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='TOP_OCCURRENCES', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 28, + "database_schema_index": 0, + "natural_language_query": "What percentage of restaurants that offer outdoor seating and live music are currently open, and how are they distributed by their average rating?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What percentage of restaurants that offer outdoor seating and live music are currently open, and how are they distributed by their average rating?", + "target_collection": "Restaurants", + "search_query": "Find restaurants that offer outdoor seating and live music.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "What percentage of restaurants that offer outdoor seating and live music are currently open, and how are they distributed by their average rating?", + "target_collection": "Restaurants", + "search_query": "outdoor seating live music", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 29, + "database_schema_index": 0, + "natural_language_query": "What percentage of confirmed reservations mention the word 'celebration' in the notes?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What percentage of confirmed reservations mention the word 'celebration' in the notes?", + "target_collection": "Reservations", + "search_query": "celebration", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "confirmed", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='PERCENTAGE_TRUE', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 30, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine in their description using search_query, and then group these restaurants by their averageRating.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine in their description using search_query, and then group these restaurants by their averageRating.", + "target_collection": "Restaurants", + "search_query": "restaurants with a cozy ambiance and Italian cuisine", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine in their description using search_query, and then group these restaurants by their averageRating.", + "target_collection": "Restaurants", + "search_query": "cozy ambiance Italian cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 31, + "database_schema_index": 0, + "natural_language_query": "Find restaurants described as having a cozy ambiance in their detailed description.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants described as having a cozy ambiance in their detailed description.", + "target_collection": "Restaurants", + "search_query": "{\"query\":\"Find restaurants with cozy ambiance.\"}", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants described as having a cozy ambiance in their detailed description.", + "target_collection": "Restaurants", + "search_query": "cozy ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 32, + "database_schema_index": 0, + "natural_language_query": "Find reservations where the partySize is greater than 4, group the results by reservationName, and calculate the average partySize for each reservationName group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find reservations where the partySize is greater than 4, group the results by reservationName, and calculate the average partySize for each reservationName group.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find reservations where the partySize is greater than 4, group the results by reservationName, and calculate the average partySize for each reservationName group.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 33, + "database_schema_index": 0, + "natural_language_query": "Find how many reservations have a partySize of at least 4 people and provide the total count.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find how many reservations have a partySize of at least 4 people and provide the total count.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 34, + "database_schema_index": 0, + "natural_language_query": "Show all reservations with a partySize of at least 5 people, count how many times each reservationName occurs, and group the results by whether the reservation is confirmed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Show all reservations with a partySize of at least 5 people, count how many times each reservationName occurs, and group the results by whether the reservation is confirmed.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "confirmed" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show all reservations with a partySize of at least 5 people, count how many times each reservationName occurs, and group the results by whether the reservation is confirmed.", + "target_collection": "Reservations", + "search_query": "reservations with a partySize of at least 5 people", + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "reservationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": { + "property_name": "confirmed", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "confirmed", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 35, + "database_schema_index": 0, + "natural_language_query": "Find all menu items with a price less than $20 and determine the top 3 most common menuItem names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find all menu items with a price less than $20 and determine the top 3 most common menuItem names.", + "target_collection": "Menus", + "search_query": null, + "integer_property_filter": { + "property_name": "price", + "operator": "<", + "value": 20.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "menuItem", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all menu items with a price less than $20 and determine the top 3 most common menuItem names.", + "target_collection": "MenuItems", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "price", + "operator": "<", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "menuItem", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 36, + "database_schema_index": 0, + "natural_language_query": "Find reservations that have at least 5 people in partySize, aggregate them by counting the number of true values in the confirmed status, and group the results by reservationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find reservations that have at least 5 people in partySize, aggregate them by counting the number of true values in the confirmed status, and group the results by reservationName.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find reservations that have at least 5 people in partySize, aggregate them by counting the number of true values in the confirmed status, and group the results by reservationName.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "confirmed", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "reservationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 37, + "database_schema_index": 0, + "natural_language_query": "Find all reservations where there are more than 4 people in the partySize and count how many of these reservations are confirmed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find all reservations where there are more than 4 people in the partySize and count how many of these reservations are confirmed.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all reservations where there are more than 4 people in the partySize and count how many of these reservations are confirmed.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "confirmed", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 38, + "database_schema_index": 0, + "natural_language_query": "Find reservations where the partySize is at least 4 and group the results by whether the reservation is confirmed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find reservations where the partySize is at least 4 and group the results by whether the reservation is confirmed.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "confirmed" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find reservations where the partySize is at least 4 and group the results by whether the reservation is confirmed.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isConfirmed", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "isConfirmed", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 39, + "database_schema_index": 0, + "natural_language_query": "Find all reservations with a partySize that is at least 5", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find all reservations with a partySize that is at least 5", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all reservations with a partySize that is at least 5", + "target_collection": "Reservations", + "search_query": "reservations", + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 40, + "database_schema_index": 0, + "natural_language_query": "Find Italian restaurants by filtering descriptions that contain the word 'Italian', then calculate the average rating of these restaurants, and group results by whether they are currently open now.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find Italian restaurants by filtering descriptions that contain the word 'Italian', then calculate the average rating of these restaurants, and group results by whether they are currently open now.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find Italian restaurants by filtering descriptions that contain the word 'Italian', then calculate the average rating of these restaurants, and group results by whether they are currently open now.", + "target_collection": "Restaurants", + "search_query": "Italian", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 41, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with the word 'vegan' in their description and count how many such restaurants exist.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with the word 'vegan' in their description and count how many such restaurants exist.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%vegan%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 42, + "database_schema_index": 0, + "natural_language_query": "Retrieve the count of restaurants containing 'Italian' in the description, group them by the openNow status, and provide the count of each restaurant name within those groups.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Retrieve the count of restaurants containing 'Italian' in the description, group them by the openNow status, and provide the count of each restaurant name within those groups.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%Italian%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 43, + "database_schema_index": 0, + "natural_language_query": "Find menu items with descriptions containing the word 'spicy' and determine the top three most common item names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find menu items with descriptions containing the word 'spicy' and determine the top three most common item names.", + "target_collection": "Menus", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "itemDescription", + "operator": "LIKE", + "value": "spicy" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "menuItem", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find menu items with descriptions containing the word 'spicy' and determine the top three most common item names.", + "target_collection": "MenuItems", + "search_query": "spicy", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "itemName", + "metrics": "SUM" + }, + "text_property_aggregation": { + "property_name": "itemName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 44, + "database_schema_index": 0, + "natural_language_query": "Find reservations that mention 'birthday' in their notes, count how many of these reservations are confirmed, and group the results by the name under which each reservation is made.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find reservations that mention 'birthday' in their notes, count how many of these reservations are confirmed, and group the results by the name under which each reservation is made.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "notes", + "operator": "LIKE", + "value": "%birthday%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find reservations that mention 'birthday' in their notes, count how many of these reservations are confirmed, and group the results by the name under which each reservation is made.", + "target_collection": "Reservations", + "search_query": "birthday", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "status", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 45, + "database_schema_index": 0, + "natural_language_query": "Find all restaurants that mention 'vegan' in their description and count how many are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find all restaurants that mention 'vegan' in their description and count how many are currently open.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "vegan" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all restaurants that mention 'vegan' in their description and count how many are currently open.", + "target_collection": "Restaurants", + "search_query": "vegan", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 46, + "database_schema_index": 0, + "natural_language_query": "Find restaurants where the description contains 'Italian cuisine' and group these results by their name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants where the description contains 'Italian cuisine' and group these results by their name.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian cuisine" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "3 validation errors for IntPropertyFilter\nproperty_name\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\noperator\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\nvalue\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing" + }, + { + "query_index": 47, + "database_schema_index": 0, + "natural_language_query": "Find restaurants in the Restaurants collection where the description contains the keyword 'Italian'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants in the Restaurants collection where the description contains the keyword 'Italian'.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "3 validation errors for IntPropertyFilter\nproperty_name\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\noperator\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\nvalue\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing" + }, + { + "query_index": 48, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that are currently open, group them by their averageRating, and calculate the mean averageRating for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that are currently open, group them by their averageRating, and calculate the mean averageRating for each group.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that are currently open, group them by their averageRating, and calculate the mean averageRating for each group.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 49, + "database_schema_index": 0, + "natural_language_query": "Determine the average rating of all restaurants that are open now, filtering by the openNow property, and calculate the mean on the averageRating property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Determine the average rating of all restaurants that are open now, filtering by the openNow property, and calculate the mean on the averageRating property.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Determine the average rating of all restaurants that are open now, filtering by the openNow property, and calculate the mean on the averageRating property.", + "target_collection": "Restaurants", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 50, + "database_schema_index": 0, + "natural_language_query": "What types of cuisines are available in restaurants that are currently open, grouped by their average rating?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What types of cuisines are available in restaurants that are currently open, grouped by their average rating?", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "What types of cuisines are available in restaurants that are currently open, grouped by their average rating?", + "target_collection": "Restaurants", + "search_query": "types of cuisines", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "description.cuisine", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 51, + "database_schema_index": 0, + "natural_language_query": "Identify the most common cuisine type among all restaurants that are currently open (using 'openNow' property for filtering and 'description' property for text aggregation).", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Identify the most common cuisine type among all restaurants that are currently open (using 'openNow' property for filtering and 'description' property for text aggregation).", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify the most common cuisine type among all restaurants that are currently open (using 'openNow' property for filtering and 'description' property for text aggregation).", + "target_collection": "Restaurants", + "search_query": "most common cuisine type", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description.cuisine", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "description.cuisine", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.65, + "error": null + }, + { + "query_index": 52, + "database_schema_index": 0, + "natural_language_query": "Calculate the percentage of restaurants that are currently open (openNow = true), and group these open restaurants by their averageRating to understand how many are open in each rating category.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of restaurants that are currently open (openNow = true), and group these open restaurants by their averageRating to understand how many are open in each rating category.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of restaurants that are currently open (openNow = true), and group these open restaurants by their averageRating to understand how many are open in each rating category.", + "target_collection": "Restaurants", + "search_query": "restaurants that are currently open", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": "=", + "value": 0 + }, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 53, + "database_schema_index": 0, + "natural_language_query": "Show me all confirmed reservations and count the total number of confirmed versus unconfirmed reservations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Show me all confirmed reservations and count the total number of confirmed versus unconfirmed reservations.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "confirmed", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Show me all confirmed reservations and count the total number of confirmed versus unconfirmed reservations.", + "target_collection": "Reservations", + "search_query": "confirmed reservations", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "isConfirmed", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isConfirmed", + "metrics": "TOTAL_FALSE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 54, + "database_schema_index": 0, + "natural_language_query": "Show all restaurants that are currently open (openNow = true), and group these by the type of cuisine mentioned in the description to see how many open restaurants exist for each cuisine type.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Show all restaurants that are currently open (openNow = true), and group these by the type of cuisine mentioned in the description to see how many open restaurants exist for each cuisine type.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show all restaurants that are currently open (openNow = true), and group these by the type of cuisine mentioned in the description to see how many open restaurants exist for each cuisine type.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description.cuisine", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 55, + "database_schema_index": 0, + "natural_language_query": "Find restaurants where openNow is true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants where openNow is true.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants where openNow is true.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 56, + "database_schema_index": 0, + "natural_language_query": "Find the total party size for reservations grouped by reservationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find the total party size for reservations grouped by reservationName.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the total party size for reservations grouped by reservationName.", + "target_collection": "Reservations", + "search_query": "total party size", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 57, + "database_schema_index": 0, + "natural_language_query": "Count the number of reservations based on their partySize.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Count the number of reservations based on their partySize.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Count the number of reservations based on their partySize.", + "target_collection": "Reservations", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 58, + "database_schema_index": 0, + "natural_language_query": "Find the types of cuisines mentioned most frequently in the restaurant descriptions, grouped by whether the restaurants are currently open or closed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find the types of cuisines mentioned most frequently in the restaurant descriptions, grouped by whether the restaurants are currently open or closed.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the types of cuisines mentioned most frequently in the restaurant descriptions, grouped by whether the restaurants are currently open or closed.", + "target_collection": "Restaurants", + "search_query": "cuisines", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description.cuisine", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 59, + "database_schema_index": 0, + "natural_language_query": "What are the three most common phrases in the description of restaurants?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What are the three most common phrases in the description of restaurants?", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='TOP_OCCURRENCES', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 60, + "database_schema_index": 0, + "natural_language_query": "Calculate the percentage of restaurants that are open now within each grouping by their average rating.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of restaurants that are open now within each grouping by their average rating.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of restaurants that are open now within each grouping by their average rating.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 61, + "database_schema_index": 0, + "natural_language_query": "Calculate the percentage of menu items that are vegetarian based on the isVegetarian property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of menu items that are vegetarian based on the isVegetarian property.", + "target_collection": "Menus", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isVegetarian", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of menu items that are vegetarian based on the isVegetarian property.", + "target_collection": "MenuItems", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isVegetarian", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 62, + "database_schema_index": 0, + "natural_language_query": "Group restaurants by their averageRating to analyze patterns across different rating categories, helping to understand how many restaurants fall into each rating group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Group restaurants by their averageRating to analyze patterns across different rating categories, helping to understand how many restaurants fall into each rating group.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group restaurants by their averageRating to analyze patterns across different rating categories, helping to understand how many restaurants fall into each rating group.", + "target_collection": "Restaurants", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 63, + "database_schema_index": 0, + "natural_language_query": "Identify clinics that specialize in pediatric care using semantic search, filter out only those with an averagePatientSatisfaction of 4.5 or higher, calculate the mean averagePatientSatisfaction, and group these results based on whether they are acceptingNewPatients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Identify clinics that specialize in pediatric care using semantic search, filter out only those with an averagePatientSatisfaction of 4.5 or higher, calculate the mean averagePatientSatisfaction, and group these results based on whether they are acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": "Find clinics that specialize in pediatric care", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify clinics that specialize in pediatric care using semantic search, filter out only those with an averagePatientSatisfaction of 4.5 or higher, calculate the mean averagePatientSatisfaction, and group these results based on whether they are acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": "clinics that specialize in pediatric care", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 64, + "database_schema_index": 1, + "natural_language_query": "Retrieve clinics with descriptions including 'comprehensive healthcare', having averagePatientSatisfaction greater than 4.5, and count how many of these clinics are acceptingNewPatients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Retrieve clinics with descriptions including 'comprehensive healthcare', having averagePatientSatisfaction greater than 4.5, and count how many of these clinics are acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": "Find clinics whose description includes comprehensive healthcare", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve clinics with descriptions including 'comprehensive healthcare', having averagePatientSatisfaction greater than 4.5, and count how many of these clinics are acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": "comprehensive healthcare", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 65, + "database_schema_index": 1, + "natural_language_query": "Find clinics related to cardiology with average patient satisfaction higher than 4. Resulting clinics should be grouped based on whether they are accepting new patients or not, and within each group, identify the top 5 most common service descriptions.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics related to cardiology with average patient satisfaction higher than 4. Resulting clinics should be grouped based on whether they are accepting new patients or not, and within each group, identify the top 5 most common service descriptions.", + "target_collection": "Clinics", + "search_query": "cardiology", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics related to cardiology with average patient satisfaction higher than 4. Resulting clinics should be grouped based on whether they are accepting new patients or not, and within each group, identify the top 5 most common service descriptions.", + "target_collection": "Clinics", + "search_query": "clinics related to cardiology", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "serviceDescription", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 66, + "database_schema_index": 1, + "natural_language_query": "Find doctors with expertise related to dermatology and skin care, who have at least 10 years of experience, and retrieve the top 3 most common doctor names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors with expertise related to dermatology and skin care, who have at least 10 years of experience, and retrieve the top 3 most common doctor names.", + "target_collection": "Doctors", + "search_query": "Find doctors with expertise related to dermatology and skin care", + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "doctorName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors with expertise related to dermatology and skin care, who have at least 10 years of experience, and retrieve the top 3 most common doctor names.", + "target_collection": "Doctors", + "search_query": "expertise related to dermatology and skin care", + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "doctorName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 67, + "database_schema_index": 1, + "natural_language_query": "Find clinics specialized in cardiovascular healthcare by searching \"description\"; filter these to only show clinics with an \"averagePatientSatisfaction\" greater than 4.5; determine the percentage of these clinics \"acceptingNewPatients\"; and finally, organize the results by \"clinicName\".", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics specialized in cardiovascular healthcare by searching \"description\"; filter these to only show clinics with an \"averagePatientSatisfaction\" greater than 4.5; determine the percentage of these clinics \"acceptingNewPatients\"; and finally, organize the results by \"clinicName\".", + "target_collection": "Clinics", + "search_query": "Find clinics that are specialized in cardiovascular healthcare.", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics specialized in cardiovascular healthcare by searching \"description\"; filter these to only show clinics with an \"averagePatientSatisfaction\" greater than 4.5; determine the percentage of these clinics \"acceptingNewPatients\"; and finally, organize the results by \"clinicName\".", + "target_collection": "Clinics", + "search_query": "cardiovascular healthcare", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 68, + "database_schema_index": 1, + "natural_language_query": "Find clinics offering pediatric services with an average patient satisfaction score greater than 4, and count the total number of clinics that are currently accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics offering pediatric services with an average patient satisfaction score greater than 4, and count the total number of clinics that are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find clinics offering pediatric services", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics offering pediatric services with an average patient satisfaction score greater than 4, and count the total number of clinics that are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "clinics offering pediatric services", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfactionScore", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "total", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.775, + "error": null + }, + { + "query_index": 69, + "database_schema_index": 1, + "natural_language_query": "Find doctors who specialize in neurology with more than 10 years of experience, and group the results by whether they are currently practicing or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors who specialize in neurology with more than 10 years of experience, and group the results by whether they are currently practicing or not.", + "target_collection": "Doctors", + "search_query": "Find doctors who specialize in neurology", + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors who specialize in neurology with more than 10 years of experience, and group the results by whether they are currently practicing or not.", + "target_collection": "Doctors", + "search_query": "doctors who specialize in neurology", + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyPracticing", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "currentlyPracticing", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 70, + "database_schema_index": 1, + "natural_language_query": "Find clinics with a description similar to 'pediatric care' that have an averagePatientSatisfaction score of at least 4.5.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics with a description similar to 'pediatric care' that have an averagePatientSatisfaction score of at least 4.5.", + "target_collection": "Clinics", + "search_query": "pediatric care", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics with a description similar to 'pediatric care' that have an averagePatientSatisfaction score of at least 4.5.", + "target_collection": "Clinics", + "search_query": "pediatric care", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 71, + "database_schema_index": 1, + "natural_language_query": "Identify clinics that offer dental services by performing a search for relevant specialties, filter specifically for a clinic named Sunny Clinic, determine the maximum average patient satisfaction score, and group the results based on whether they are accepting new patients or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Identify clinics that offer dental services by performing a search for relevant specialties, filter specifically for a clinic named Sunny Clinic, determine the maximum average patient satisfaction score, and group the results based on whether they are accepting new patients or not.", + "target_collection": "Clinics", + "search_query": "Find clinics that offer dental services and check their specialties", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "Sunny Clinic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify clinics that offer dental services by performing a search for relevant specialties, filter specifically for a clinic named Sunny Clinic, determine the maximum average patient satisfaction score, and group the results based on whether they are accepting new patients or not.", + "target_collection": "Clinics", + "search_query": "dental services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Sunny Clinic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfactionScore", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9, + "error": null + }, + { + "query_index": 72, + "database_schema_index": 1, + "natural_language_query": "Find clinics with a description similar to 'clinic with specialties in cardiology and pediatric care', where the clinicName is exactly 'City Health Center', and calculate the average of averagePatientSatisfaction for these clinics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics with a description similar to 'clinic with specialties in cardiology and pediatric care', where the clinicName is exactly 'City Health Center', and calculate the average of averagePatientSatisfaction for these clinics.", + "target_collection": "Clinics", + "search_query": "clinic with specialties in cardiology and pediatric care", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "City Health Center" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics with a description similar to 'clinic with specialties in cardiology and pediatric care', where the clinicName is exactly 'City Health Center', and calculate the average of averagePatientSatisfaction for these clinics.", + "target_collection": "Clinics", + "search_query": "clinic with specialties in cardiology and pediatric care", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "City Health Center" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 73, + "database_schema_index": 1, + "natural_language_query": "Find clinics that offer family healthcare services using semantic search, and are accepting new patients. Count the number of unique clinics and group them by average patient satisfaction score.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that offer family healthcare services using semantic search, and are accepting new patients. Count the number of unique clinics and group them by average patient satisfaction score.", + "target_collection": "Clinics", + "search_query": "Family healthcare services", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 74, + "database_schema_index": 1, + "natural_language_query": "Find clinics that describe themselves as offering holistic healthcare services, filter those with 'Health' in their clinicName, and identify the top 3 most frequently occurring clinic names from those results.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that describe themselves as offering holistic healthcare services, filter those with 'Health' in their clinicName, and identify the top 3 most frequently occurring clinic names from those results.", + "target_collection": "Clinics", + "search_query": "Find clinics that offer holistic healthcare services based on detailed description", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "LIKE", + "value": "%Health%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "3 validation errors for IntPropertyFilter\nproperty_name\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\noperator\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\nvalue\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing" + }, + { + "query_index": 75, + "database_schema_index": 1, + "natural_language_query": "Find the best clinics known for pediatric services, where clinic names start with 'A', group them by average patient satisfaction, and count how many are accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find the best clinics known for pediatric services, where clinic names start with 'A', group them by average patient satisfaction, and count how many are accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find the best clinics known for pediatric services", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "LIKE", + "value": "A%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the best clinics known for pediatric services, where clinic names start with 'A', group them by average patient satisfaction, and count how many are accepting new patients.", + "target_collection": "Clinics", + "search_query": "best clinics known for pediatric services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "A%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 76, + "database_schema_index": 1, + "natural_language_query": "Find appointments related to annual health check-ups by searching in appointmentNotes for 'check-up', and count how many of these appointments are confirmed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find appointments related to annual health check-ups by searching in appointmentNotes for 'check-up', and count how many of these appointments are confirmed.", + "target_collection": "Appointments", + "search_query": "Find the appointments that are relevant to annual health check-ups", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "appointmentNotes", + "operator": "LIKE", + "value": "check-up" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find appointments related to annual health check-ups by searching in appointmentNotes for 'check-up', and count how many of these appointments are confirmed.", + "target_collection": "Appointments", + "search_query": "check-up", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "confirmed", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 77, + "database_schema_index": 1, + "natural_language_query": "Search for clinics that have descriptions mentioning advanced medical technology, filter by the clinic name \"Healthcare Plus Clinic\", and group the results by whether they are accepting new patients, aggregating average patient satisfaction scores within each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Search for clinics that have descriptions mentioning advanced medical technology, filter by the clinic name \"Healthcare Plus Clinic\", and group the results by whether they are accepting new patients, aggregating average patient satisfaction scores within each group.", + "target_collection": "Clinics", + "search_query": "Find clinics whose description includes advanced medical technology.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "Healthcare Plus Clinic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for clinics that have descriptions mentioning advanced medical technology, filter by the clinic name \"Healthcare Plus Clinic\", and group the results by whether they are accepting new patients, aggregating average patient satisfaction scores within each group.", + "target_collection": "Clinics", + "search_query": "advanced medical technology", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Healthcare Plus Clinic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfactionScore", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 78, + "database_schema_index": 1, + "natural_language_query": "Search for clinics whose description indicates a focus on comprehensive dermatology services and skin care treatments, and filter to include only those clinics with 'Dermatology' in their clinicName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Search for clinics whose description indicates a focus on comprehensive dermatology services and skin care treatments, and filter to include only those clinics with 'Dermatology' in their clinicName.", + "target_collection": "Clinics", + "search_query": "Find clinics that provide comprehensive dermatology services and skin care treatments", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "LIKE", + "value": "*Dermatology*" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for clinics whose description indicates a focus on comprehensive dermatology services and skin care treatments, and filter to include only those clinics with 'Dermatology' in their clinicName.", + "target_collection": "Clinics", + "search_query": "comprehensive dermatology services and skin care treatments", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "LIKE", + "value": "Dermatology" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description.cuisine", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 79, + "database_schema_index": 1, + "natural_language_query": "Find clinics based on a high patient satisfaction, filter to include only those currently accepting new patients, perform an average calculation of the averagePatientSatisfaction, and group the results by clinic name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics based on a high patient satisfaction, filter to include only those currently accepting new patients, perform an average calculation of the averagePatientSatisfaction, and group the results by clinic name.", + "target_collection": "Clinics", + "search_query": "high patient satisfaction", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics based on a high patient satisfaction, filter to include only those currently accepting new patients, perform an average calculation of the averagePatientSatisfaction, and group the results by clinic name.", + "target_collection": "Clinics", + "search_query": "clinics based on a high patient satisfaction", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 80, + "database_schema_index": 1, + "natural_language_query": "Find clinics that are conceptually related to pediatrics, are accepting new patients, and calculate the mean average patient satisfaction score across all such clinics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that are conceptually related to pediatrics, are accepting new patients, and calculate the mean average patient satisfaction score across all such clinics.", + "target_collection": "Clinics", + "search_query": "pediatrics", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that are conceptually related to pediatrics, are accepting new patients, and calculate the mean average patient satisfaction score across all such clinics.", + "target_collection": "Clinics", + "search_query": "clinics that are conceptually related to pediatrics", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "patientSatisfactionScore", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 81, + "database_schema_index": 1, + "natural_language_query": "Find doctors with expertise in cardiology who are currently practicing, show how many doctors there are per expertise, and group them by their expertise category.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors with expertise in cardiology who are currently practicing, show how many doctors there are per expertise, and group them by their expertise category.", + "target_collection": "Doctors", + "search_query": "Find doctors with expertise in 'cardiology'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyPracticing", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "expertise" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors with expertise in cardiology who are currently practicing, show how many doctors there are per expertise, and group them by their expertise category.", + "target_collection": "Doctors", + "search_query": "doctors with expertise in cardiology", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyPracticing", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "expertiseCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "expertiseCategory", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 82, + "database_schema_index": 1, + "natural_language_query": "Find clinics that match specific healthcare needs and services, filter to show only those accepting new patients, and aggregate to find the top 5 most common descriptions of these clinics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that match specific healthcare needs and services, filter to show only those accepting new patients, and aggregate to find the top 5 most common descriptions of these clinics.", + "target_collection": "Clinics", + "search_query": "Find clinics that provide specialties or services mentioned in the search", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that match specific healthcare needs and services, filter to show only those accepting new patients, and aggregate to find the top 5 most common descriptions of these clinics.", + "target_collection": "Clinics", + "search_query": "clinics that match specific healthcare needs and services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 83, + "database_schema_index": 1, + "natural_language_query": "Identify clinics that provide cardiology services (using descriptions for search), determine which of them are currently accepting new patients, and count the number of clinics within each range of average patient satisfaction scores.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Identify clinics that provide cardiology services (using descriptions for search), determine which of them are currently accepting new patients, and count the number of clinics within each range of average patient satisfaction scores.", + "target_collection": "Clinics", + "search_query": "Find clinics offering cardiology services", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 84, + "database_schema_index": 1, + "natural_language_query": "Find clinics that match the concept of 'family healthcare services', filter those that are accepting new patients, and calculate the percentage of clinics that are accepting new patients among the total results.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that match the concept of 'family healthcare services', filter those that are accepting new patients, and calculate the percentage of clinics that are accepting new patients among the total results.", + "target_collection": "Clinics", + "search_query": "Find clinics that match the concept of 'family healthcare services'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that match the concept of 'family healthcare services', filter those that are accepting new patients, and calculate the percentage of clinics that are accepting new patients among the total results.", + "target_collection": "Clinics", + "search_query": "family healthcare services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 85, + "database_schema_index": 1, + "natural_language_query": "Find clinics that specialize in pediatric care and are accepting new patients, then group the results by their average patient satisfaction score.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that specialize in pediatric care and are accepting new patients, then group the results by their average patient satisfaction score.", + "target_collection": "Clinics", + "search_query": "Find clinics that specialize in pediatric care", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that specialize in pediatric care and are accepting new patients, then group the results by their average patient satisfaction score.", + "target_collection": "Clinics", + "search_query": "clinics that specialize in pediatric care", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfactionScore", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfactionScore", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 86, + "database_schema_index": 1, + "natural_language_query": "Find clinics that specialize in cardiac care based on their description and are currently accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that specialize in cardiac care based on their description and are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find clinics that specialize in cardiac care based on their description", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that specialize in cardiac care based on their description and are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "clinics that specialize in cardiac care", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 87, + "database_schema_index": 1, + "natural_language_query": "List clinics that provide excellent healthcare services. Within these clinics, group them by their clinic names and count how many are currently accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "List clinics that provide excellent healthcare services. Within these clinics, group them by their clinic names and count how many are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find clinics that match the description of providing excellent healthcare services with high specialties", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "List clinics that provide excellent healthcare services. Within these clinics, group them by their clinic names and count how many are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "excellent healthcare services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 88, + "database_schema_index": 1, + "natural_language_query": "Find doctors in the Doctors collection specializing in 'cardiology' based on their expertise property, and calculate the mean yearsOfExperience for these doctors.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors in the Doctors collection specializing in 'cardiology' based on their expertise property, and calculate the mean yearsOfExperience for these doctors.", + "target_collection": "Doctors", + "search_query": "Find doctors specializing in cardiology", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors in the Doctors collection specializing in 'cardiology' based on their expertise property, and calculate the mean yearsOfExperience for these doctors.", + "target_collection": "Doctors", + "search_query": "cardiology", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 89, + "database_schema_index": 1, + "natural_language_query": "Find clinics that provide 'dental services', group them by whether they are accepting new patients, and count how many clinics are in each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that provide 'dental services', group them by whether they are accepting new patients, and count how many clinics are in each group.", + "target_collection": "Clinics", + "search_query": "Find clinics providing 'dental services'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that provide 'dental services', group them by whether they are accepting new patients, and count how many clinics are in each group.", + "target_collection": "Clinics", + "search_query": "dental services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "total_count", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 90, + "database_schema_index": 1, + "natural_language_query": "Find clinics offering high-quality healthcare services based on their description, and count the number of unique clinic names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics offering high-quality healthcare services based on their description, and count the number of unique clinic names.", + "target_collection": "Clinics", + "search_query": "High-quality healthcare services", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 91, + "database_schema_index": 1, + "natural_language_query": "Search for clinics where the description mentions specific healthcare services you need, determine what percentage of these clinics are accepting new patients, and group the results by clinicName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Search for clinics where the description mentions specific healthcare services you need, determine what percentage of these clinics are accepting new patients, and group the results by clinicName.", + "target_collection": "Clinics", + "search_query": "Find clinics with descriptions similar to healthcare services or specialties you need", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for clinics where the description mentions specific healthcare services you need, determine what percentage of these clinics are accepting new patients, and group the results by clinicName.", + "target_collection": "Clinics", + "search_query": "specific healthcare services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 92, + "database_schema_index": 1, + "natural_language_query": "How many clinics that offer pediatrics and family healthcare are currently accepting new patients?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "How many clinics that offer pediatrics and family healthcare are currently accepting new patients?", + "target_collection": "Clinics", + "search_query": "Find clinics that offer pediatrics and family healthcare", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "How many clinics that offer pediatrics and family healthcare are currently accepting new patients?", + "target_collection": "Clinics", + "search_query": "clinics that offer pediatrics and family healthcare", + "limit": 5, + "integer_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": 1 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 93, + "database_schema_index": 1, + "natural_language_query": "Find clinics that specialize in pediatric services, offer state-of-the-art facilities, and have high ratings for patient care experience, and then group these clinics based on whether they are accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that specialize in pediatric services, offer state-of-the-art facilities, and have high ratings for patient care experience, and then group these clinics based on whether they are accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find clinics that specialize in pediatric services, offer state-of-the-art facilities, and have high ratings for patient care experience", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that specialize in pediatric services, offer state-of-the-art facilities, and have high ratings for patient care experience, and then group these clinics based on whether they are accepting new patients.", + "target_collection": "Clinics", + "search_query": "clinics that specialize in pediatric services, offer state-of-the-art facilities, and have high ratings for patient care experience", + "limit": 5, + "integer_property_filter": { + "property_name": "patientCareExperienceRating", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 94, + "database_schema_index": 1, + "natural_language_query": "What clinics are recognized for their exceptional orthopedic services and a high emphasis on patient care?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "What clinics are recognized for their exceptional orthopedic services and a high emphasis on patient care?", + "target_collection": "Clinics", + "search_query": "Find clinics that are renowned for exceptional orthopedic services and have a high focus on patient care.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What clinics are recognized for their exceptional orthopedic services and a high emphasis on patient care?", + "target_collection": "Clinics", + "search_query": "exceptional orthopedic services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "patientCareEmphasis", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 95, + "database_schema_index": 1, + "natural_language_query": "Find doctors with more than 10 yearsOfExperience, calculate the average yearsOfExperience for these doctors, and group the results by whether they are currentlyPracticing or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors with more than 10 yearsOfExperience, calculate the average yearsOfExperience for these doctors, and group the results by whether they are currentlyPracticing or not.", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors with more than 10 yearsOfExperience, calculate the average yearsOfExperience for these doctors, and group the results by whether they are currentlyPracticing or not.", + "target_collection": "Doctors", + "search_query": "doctors with more than 10 yearsOfExperience", + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 96, + "database_schema_index": 1, + "natural_language_query": "Find the number of clinics where the averagePatientSatisfaction score is at least 4.5", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find the number of clinics where the averagePatientSatisfaction score is at least 4.5", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the number of clinics where the averagePatientSatisfaction score is at least 4.5", + "target_collection": "Clinics", + "search_query": "clinics", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 97, + "database_schema_index": 1, + "natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5, then group results by acceptingNewPatients status and determine the top 3 most common specialties within each group's description.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5, then group results by acceptingNewPatients status and determine the top 3 most common specialties within each group's description.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5, then group results by acceptingNewPatients status and determine the top 3 most common specialties within each group's description.", + "target_collection": "Clinics", + "search_query": "clinics where the averagePatientSatisfaction is at least 4.5", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description.specialty", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 98, + "database_schema_index": 1, + "natural_language_query": "Find appointments that have an appointmentDuration of at least 30 minutes and determine the most common patientName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find appointments that have an appointmentDuration of at least 30 minutes and determine the most common patientName.", + "target_collection": "Appointments", + "search_query": null, + "integer_property_filter": { + "property_name": "appointmentDuration", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "patientName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find appointments that have an appointmentDuration of at least 30 minutes and determine the most common patientName.", + "target_collection": "Appointments", + "search_query": "appointments that have an appointmentDuration of at least 30 minutes", + "limit": 5, + "integer_property_filter": { + "property_name": "appointmentDuration", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "patientName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 99, + "database_schema_index": 1, + "natural_language_query": "Group clinics by their clinicName, but only include those with an averagePatientSatisfaction of at least 4.5, and count how many of these clinics are currently accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Group clinics by their clinicName, but only include those with an averagePatientSatisfaction of at least 4.5, and count how many of these clinics are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group clinics by their clinicName, but only include those with an averagePatientSatisfaction of at least 4.5, and count how many of these clinics are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 100, + "database_schema_index": 1, + "natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5 and count how many of these clinics are currently acceptingNewPatients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5 and count how many of these clinics are currently acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 101, + "database_schema_index": 1, + "natural_language_query": "Find doctors with at least 10 years of experience and group results by whether they are currently practicing.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors with at least 10 years of experience and group results by whether they are currently practicing.", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors with at least 10 years of experience and group results by whether they are currently practicing.", + "target_collection": "Doctors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 102, + "database_schema_index": 1, + "natural_language_query": "Find doctors who have more than 10 years in yearsOfExperience", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors who have more than 10 years in yearsOfExperience", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors who have more than 10 years in yearsOfExperience", + "target_collection": "Doctors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 103, + "database_schema_index": 1, + "natural_language_query": "Find all clinics where the description contains the keyword 'specialty', group them by their acceptingNewPatients status, and calculate the maximum averagePatientSatisfaction score for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find all clinics where the description contains the keyword 'specialty', group them by their acceptingNewPatients status, and calculate the maximum averagePatientSatisfaction score for each group.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "specialty" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all clinics where the description contains the keyword 'specialty', group them by their acceptingNewPatients status, and calculate the maximum averagePatientSatisfaction score for each group.", + "target_collection": "Clinics", + "search_query": "specialty", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 104, + "database_schema_index": 1, + "natural_language_query": "How many appointments have the word 'consultation' in their appointmentNotes and what is their total count for appointmentDuration?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "How many appointments have the word 'consultation' in their appointmentNotes and what is their total count for appointmentDuration?", + "target_collection": "Appointments", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "appointmentNotes", + "operator": "LIKE", + "value": "consultation" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 105, + "database_schema_index": 1, + "natural_language_query": "Identify how many different averagePatientSatisfaction scores exist for clinics whose description includes the term 'multispecialty', grouped by the description property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Identify how many different averagePatientSatisfaction scores exist for clinics whose description includes the term 'multispecialty', grouped by the description property.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "multispecialty" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 106, + "database_schema_index": 1, + "natural_language_query": "Find the number of unique clinicName values from the Clinics collection where the description contains the word 'dental' by counting these occurrences.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find the number of unique clinicName values from the Clinics collection where the description contains the word 'dental' by counting these occurrences.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%dental%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 107, + "database_schema_index": 1, + "natural_language_query": "Show the percentage of clinics accepting new patients, grouped by clinicName, where the clinic's description contains the word pediatrics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Show the percentage of clinics accepting new patients, grouped by clinicName, where the clinic's description contains the word pediatrics.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "pediatrics" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show the percentage of clinics accepting new patients, grouped by clinicName, where the clinic's description contains the word pediatrics.", + "target_collection": "Clinics", + "search_query": "pediatrics", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 108, + "database_schema_index": 1, + "natural_language_query": "Find clinics where the description includes 'cancer', and determine how many of these clinics are accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics where the description includes 'cancer', and determine how many of these clinics are accepting new patients.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%cancer%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics where the description includes 'cancer', and determine how many of these clinics are accepting new patients.", + "target_collection": "Clinics", + "search_query": "cancer", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "total_count", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.775, + "error": null + }, + { + "query_index": 109, + "database_schema_index": 1, + "natural_language_query": "Find clinics that have 'pediatrics' in their description, and group them by whether they are accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that have 'pediatrics' in their description, and group them by whether they are accepting new patients.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "pediatrics" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that have 'pediatrics' in their description, and group them by whether they are accepting new patients.", + "target_collection": "Clinics", + "search_query": "pediatrics", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 110, + "database_schema_index": 1, + "natural_language_query": "Retrieve the clinic that has the exact clinicName 'Community HealthCare Center'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Retrieve the clinic that has the exact clinicName 'Community HealthCare Center'.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "Community HealthCare Center" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "3 validation errors for IntPropertyFilter\nproperty_name\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\noperator\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\nvalue\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing" + }, + { + "query_index": 111, + "database_schema_index": 1, + "natural_language_query": "For clinics that are accepting new patients, calculate the mean averagePatientSatisfaction score for each category described by 'description'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "For clinics that are accepting new patients, calculate the mean averagePatientSatisfaction score for each category described by 'description'.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description" + }, + "predicted_query": { + "corresponding_natural_language_query": "For clinics that are accepting new patients, calculate the mean averagePatientSatisfaction score for each category described by 'description'.", + "target_collection": "Clinics", + "search_query": "clinics that are accepting new patients", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 112, + "database_schema_index": 1, + "natural_language_query": "Find clinics that are accepting new patients and calculate the mean of averagePatientSatisfaction scores for those clinics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that are accepting new patients and calculate the mean of averagePatientSatisfaction scores for those clinics.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that are accepting new patients and calculate the mean of averagePatientSatisfaction scores for those clinics.", + "target_collection": "Clinics", + "search_query": "clinics that are accepting new patients", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 113, + "database_schema_index": 1, + "natural_language_query": "Find clinics that are accepting new patients (using 'acceptingNewPatients' with true value), group the results by clinicName, and aggregate to count the occurrences of each clinic name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that are accepting new patients (using 'acceptingNewPatients' with true value), group the results by clinicName, and aggregate to count the occurrences of each clinic name.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that are accepting new patients (using 'acceptingNewPatients' with true value), group the results by clinicName, and aggregate to count the occurrences of each clinic name.", + "target_collection": "Clinics", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 114, + "database_schema_index": 1, + "natural_language_query": "Find all clinics where acceptingNewPatients is true, and count how many different clinics share the same description.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find all clinics where acceptingNewPatients is true, and count how many different clinics share the same description.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all clinics where acceptingNewPatients is true, and count how many different clinics share the same description.", + "target_collection": "Clinics", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "description", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 115, + "database_schema_index": 1, + "natural_language_query": "Find and display the percentage of clinics that are currently accepting new patients, grouped by each clinic's name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find and display the percentage of clinics that are currently accepting new patients, grouped by each clinic's name.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find and display the percentage of clinics that are currently accepting new patients, grouped by each clinic's name.", + "target_collection": "Clinics", + "search_query": "clinics that are currently accepting new patients", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 116, + "database_schema_index": 1, + "natural_language_query": "Find all appointments where appointmentConfirmed is false and also count the total number of appointments based on appointmentConfirmed status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find all appointments where appointmentConfirmed is false and also count the total number of appointments based on appointmentConfirmed status.", + "target_collection": "Appointments", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "appointmentConfirmed", + "operator": "=", + "value": false + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all appointments where appointmentConfirmed is false and also count the total number of appointments based on appointmentConfirmed status.", + "target_collection": "Appointments", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "appointmentConfirmed", + "operator": "=", + "value": false + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "appointmentConfirmed", + "metrics": "PERCENTAGE_FALSE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 117, + "database_schema_index": 1, + "natural_language_query": "Find all clinics that are accepting new patients and group them by clinicName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find all clinics that are accepting new patients and group them by clinicName.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all clinics that are accepting new patients and group them by clinicName.", + "target_collection": "Clinics", + "search_query": "clinics that are accepting new patients", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 118, + "database_schema_index": 1, + "natural_language_query": "Find clinics where acceptingNewPatients is equal to true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics where acceptingNewPatients is equal to true.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics where acceptingNewPatients is equal to true.", + "target_collection": "Clinics", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 119, + "database_schema_index": 1, + "natural_language_query": "Determine the mean years of experience for doctors, categorized by their expertise.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Determine the mean years of experience for doctors, categorized by their expertise.", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "expertise" + }, + "predicted_query": { + "corresponding_natural_language_query": "Determine the mean years of experience for doctors, categorized by their expertise.", + "target_collection": "Doctors", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "expertise", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 120, + "database_schema_index": 1, + "natural_language_query": "Using the int_property_aggregation operator, calculate the total number of years of experience across all doctors by summing the 'yearsOfExperience' property in the Doctors collection.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Using the int_property_aggregation operator, calculate the total number of years of experience across all doctors by summing the 'yearsOfExperience' property in the Doctors collection.", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Using the int_property_aggregation operator, calculate the total number of years of experience across all doctors by summing the 'yearsOfExperience' property in the Doctors collection.", + "target_collection": "Doctors", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 121, + "database_schema_index": 1, + "natural_language_query": "What are the top 5 most common areas of expertise for doctors, grouped by whether they are currently practicing?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "What are the top 5 most common areas of expertise for doctors, grouped by whether they are currently practicing?", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "expertise", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the top 5 most common areas of expertise for doctors, grouped by whether they are currently practicing?", + "target_collection": "Doctors", + "search_query": "areas of expertise", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "total_count", + "metrics": "SUM" + }, + "text_property_aggregation": { + "property_name": "expertise", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": { + "property_name": "currentlyPracticing", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "currentlyPracticing", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 122, + "database_schema_index": 1, + "natural_language_query": "What are the top 5 most common clinicName entries in the Clinics collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "What are the top 5 most common clinicName entries in the Clinics collection?", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='TOP_OCCURRENCES', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 123, + "database_schema_index": 1, + "natural_language_query": "Calculate the percentage of clinics that are accepting new patients, grouped by their average patient satisfaction.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of clinics that are accepting new patients, grouped by their average patient satisfaction.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of clinics that are accepting new patients, grouped by their average patient satisfaction.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 124, + "database_schema_index": 1, + "natural_language_query": "How many clinics are currently accepting new patients compared to those that are not?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "How many clinics are currently accepting new patients compared to those that are not?", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "How many clinics are currently accepting new patients compared to those that are not?", + "target_collection": "Clinics", + "search_query": "clinics accepting new patients", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "total_count", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_FALSE" + }, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 125, + "database_schema_index": 1, + "natural_language_query": "Group clinics by their averagePatientSatisfaction scores to see the distribution of clinics based on patient satisfaction levels, organizing the results into different satisfaction categories.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Group clinics by their averagePatientSatisfaction scores to see the distribution of clinics based on patient satisfaction levels, organizing the results into different satisfaction categories.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group clinics by their averagePatientSatisfaction scores to see the distribution of clinics based on patient satisfaction levels, organizing the results into different satisfaction categories.", + "target_collection": "Clinics", + "search_query": "clinics", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 126, + "database_schema_index": 1, + "natural_language_query": "Show me students interested in 'learning algorithms' who have completed more than 20 completedCredits, aggregate the count of completedCredits for these students, and group the results by their enrolledFullTime status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Show me students interested in 'learning algorithms' who have completed more than 20 completedCredits, aggregate the count of completedCredits for these students, and group the results by their enrolledFullTime status.", + "target_collection": "Students", + "search_query": "learning algorithms", + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 127, + "database_schema_index": 1, + "natural_language_query": "Find students whose researchInterests include machine learning, filter those who have completedCredits of at least 30, and calculate the average completedCredits of these students.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find students whose researchInterests include machine learning, filter those who have completedCredits of at least 30, and calculate the average completedCredits of these students.", + "target_collection": "Students", + "search_query": "Find students whose researchInterests include machine learning", + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "completedCredits", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find students whose researchInterests include machine learning, filter those who have completedCredits of at least 30, and calculate the average completedCredits of these students.", + "target_collection": "Students", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "completedCredits", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 128, + "database_schema_index": 2, + "natural_language_query": "Identify courses related to machine learning that have a courseDuration of at least 5 hours, and determine the most frequently occurring courseTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify courses related to machine learning that have a courseDuration of at least 5 hours, and determine the most frequently occurring courseTitle.", + "target_collection": "Courses", + "search_query": "machine learning", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify courses related to machine learning that have a courseDuration of at least 5 hours, and determine the most frequently occurring courseTitle.", + "target_collection": "Courses", + "search_query": "courses related to machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 129, + "database_schema_index": 2, + "natural_language_query": "Find courses that semantically relate to data science and machine learning in their courseDescription, filter for those which courseDuration is at least 40 hours, and show the top 5 most common courseTitle values for these courses.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that semantically relate to data science and machine learning in their courseDescription, filter for those which courseDuration is at least 40 hours, and show the top 5 most common courseTitle values for these courses.", + "target_collection": "Courses", + "search_query": "data science and machine learning", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 40 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that semantically relate to data science and machine learning in their courseDescription, filter for those which courseDuration is at least 40 hours, and show the top 5 most common courseTitle values for these courses.", + "target_collection": "Courses", + "search_query": "data science and machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 40 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 130, + "database_schema_index": 2, + "natural_language_query": "List all courses related to artificial intelligence and machine learning that require at least 20 hours to complete, show the percentage of those courses currently accepting enrollments, and categorize the results by whether they are currently enrolling or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "List all courses related to artificial intelligence and machine learning that require at least 20 hours to complete, show the percentage of those courses currently accepting enrollments, and categorize the results by whether they are currently enrolling or not.", + "target_collection": "Courses", + "search_query": "Find courses related to artificial intelligence and machine learning.", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "List all courses related to artificial intelligence and machine learning that require at least 20 hours to complete, show the percentage of those courses currently accepting enrollments, and categorize the results by whether they are currently enrolling or not.", + "target_collection": "Courses", + "search_query": "courses related to artificial intelligence and machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "requiredHours", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 131, + "database_schema_index": 2, + "natural_language_query": "Find courses that are similar to 'data science', have a courseDuration of 40 hours or less, and calculate the percentage of these courses that are currentlyEnrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are similar to 'data science', have a courseDuration of 40 hours or less, and calculate the percentage of these courses that are currentlyEnrolling.", + "target_collection": "Courses", + "search_query": "Find courses similar to data science that enhance learning outcomes", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": "<=", + "value": 40 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are similar to 'data science', have a courseDuration of 40 hours or less, and calculate the percentage of these courses that are currentlyEnrolling.", + "target_collection": "Courses", + "search_query": "data science", + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": "<=", + "value": 40 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 132, + "database_schema_index": 2, + "natural_language_query": "Find students interested in machine learning who have completed at least 30 credits, grouped by whether they are enrolled full-time.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find students interested in machine learning who have completed at least 30 credits, grouped by whether they are enrolled full-time.", + "target_collection": "Students", + "search_query": "students interested in machine learning", + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find students interested in machine learning who have completed at least 30 credits, grouped by whether they are enrolled full-time.", + "target_collection": "Students", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "enrolledFullTime", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "enrolledFullTime", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 133, + "database_schema_index": 2, + "natural_language_query": "Find courses that relate to artificial intelligence which have a courseDuration of at least 20 hours.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that relate to artificial intelligence which have a courseDuration of at least 20 hours.", + "target_collection": "Courses", + "search_query": "Find courses related to artificial intelligence", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that relate to artificial intelligence which have a courseDuration of at least 20 hours.", + "target_collection": "Courses", + "search_query": "courses that relate to artificial intelligence", + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 134, + "database_schema_index": 2, + "natural_language_query": "What is the average duration of courses related to artificial intelligence that are currently enrolling, and organize the results by course title?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average duration of courses related to artificial intelligence that are currently enrolling, and organize the results by course title?", + "target_collection": "Courses", + "search_query": "artificial intelligence", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average duration of courses related to artificial intelligence that are currently enrolling, and organize the results by course title?", + "target_collection": "Courses", + "search_query": "courses related to artificial intelligence", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "duration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "enrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.925, + "error": null + }, + { + "query_index": 135, + "database_schema_index": 2, + "natural_language_query": "Search for courses whose descriptions are conceptually similar to 'machine learning and artificial intelligence', filter to find courses with the exact courseTitle 'Introduction to AI', and calculate the average courseDuration of these courses.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Search for courses whose descriptions are conceptually similar to 'machine learning and artificial intelligence', filter to find courses with the exact courseTitle 'Introduction to AI', and calculate the average courseDuration of these courses.", + "target_collection": "Courses", + "search_query": "Find me the courses that cover topics similar to 'machine learning and artificial intelligence'.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "=", + "value": "Introduction to AI" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for courses whose descriptions are conceptually similar to 'machine learning and artificial intelligence', filter to find courses with the exact courseTitle 'Introduction to AI', and calculate the average courseDuration of these courses.", + "target_collection": "Courses", + "search_query": "machine learning and artificial intelligence", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "=", + "value": "Introduction to AI" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 136, + "database_schema_index": 2, + "natural_language_query": "Find courses related to data science and machine learning by courseDescription, filter these courses to only those that are currently open for enrollment, count the unique course titles, and then group the courses by their duration to analyze the number of courses segmented by different durations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses related to data science and machine learning by courseDescription, filter these courses to only those that are currently open for enrollment, count the unique course titles, and then group the courses by their duration to analyze the number of courses segmented by different durations.", + "target_collection": "Courses", + "search_query": "Find courses related to data science and machine learning by courseDescription", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses related to data science and machine learning by courseDescription, filter these courses to only those that are currently open for enrollment, count the unique course titles, and then group the courses by their duration to analyze the number of courses segmented by different durations.", + "target_collection": "Courses", + "search_query": "data science and machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "duration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 137, + "database_schema_index": 2, + "natural_language_query": "Find courses that focus on machine learning that are currently enrolling, and display the top 5 most common course titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that focus on machine learning that are currently enrolling, and display the top 5 most common course titles.", + "target_collection": "Courses", + "search_query": "Find courses that focus on machine learning", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that focus on machine learning that are currently enrolling, and display the top 5 most common course titles.", + "target_collection": "Courses", + "search_query": "courses that focus on machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "enrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "enrollment", + "metrics": "MAX" + }, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 138, + "database_schema_index": 2, + "natural_language_query": "Search for courses that focus on 'machine learning' topics, filter to include only those that have 'Data Science' in their course title, calculate the percentage of these courses that are currently enrolling, and group the results by course duration.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Search for courses that focus on 'machine learning' topics, filter to include only those that have 'Data Science' in their course title, calculate the percentage of these courses that are currently enrolling, and group the results by course duration.", + "target_collection": "Courses", + "search_query": "machine learning", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Data Science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for courses that focus on 'machine learning' topics, filter to include only those that have 'Data Science' in their course title, calculate the percentage of these courses that are currently enrolling, and group the results by course duration.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Data Science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 139, + "database_schema_index": 2, + "natural_language_query": "Find instructors who are described as experienced in teaching computer science in their biography, specifically look for instructors named Jane Doe, and calculate the percentage of instructors who hold a tenured position in the 'tenured' field.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find instructors who are described as experienced in teaching computer science in their biography, specifically look for instructors named Jane Doe, and calculate the percentage of instructors who hold a tenured position in the 'tenured' field.", + "target_collection": "Instructors", + "search_query": "experienced in teaching computer science", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "instructorName", + "operator": "=", + "value": "Jane Doe" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "tenured", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find instructors who are described as experienced in teaching computer science in their biography, specifically look for instructors named Jane Doe, and calculate the percentage of instructors who hold a tenured position in the 'tenured' field.", + "target_collection": "Instructors", + "search_query": "experienced in teaching computer science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Jane Doe" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "tenured", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 140, + "database_schema_index": 2, + "natural_language_query": "Find courses related to Python programming where the course title contains 'Introduction', and group the results by whether the courses are currently enrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses related to Python programming where the course title contains 'Introduction', and group the results by whether the courses are currently enrolling.", + "target_collection": "Courses", + "search_query": "Python programming", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "%Introduction%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses related to Python programming where the course title contains 'Introduction', and group the results by whether the courses are currently enrolling.", + "target_collection": "Courses", + "search_query": "Python programming", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Introduction" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 141, + "database_schema_index": 2, + "natural_language_query": "Show me courses that cover 'machine learning fundamentals' in their descriptions and have the word 'Advanced' in the course title.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Show me courses that cover 'machine learning fundamentals' in their descriptions and have the word 'Advanced' in the course title.", + "target_collection": "Courses", + "search_query": "Find courses that cover 'machine learning fundamentals' in courseDescription", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Advanced" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "3 validation errors for IntPropertyFilter\nproperty_name\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\noperator\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\nvalue\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing" + }, + { + "query_index": 142, + "database_schema_index": 2, + "natural_language_query": "Search for courses related to machine learning and deep learning that are currently open for enrollment, calculate the average duration of these courses, and categorize the results based on the enrollment status of the courses.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Search for courses related to machine learning and deep learning that are currently open for enrollment, calculate the average duration of these courses, and categorize the results based on the enrollment status of the courses.", + "target_collection": "Courses", + "search_query": "Find courses related to machine learning and deep learning exploration", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for courses related to machine learning and deep learning that are currently open for enrollment, calculate the average duration of these courses, and categorize the results based on the enrollment status of the courses.", + "target_collection": "Courses", + "search_query": "machine learning and deep learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "duration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "enrollmentStatus", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "enrollmentStatus", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.775, + "error": null + }, + { + "query_index": 143, + "database_schema_index": 2, + "natural_language_query": "What are the courses related to 'machine learning' that are currently enrolling, and what is the average course duration?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What are the courses related to 'machine learning' that are currently enrolling, and what is the average course duration?", + "target_collection": "Courses", + "search_query": "Find courses related to 'machine learning' based on courseDescription", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the courses related to 'machine learning' that are currently enrolling, and what is the average course duration?", + "target_collection": "Courses", + "search_query": "courses related to 'machine learning'", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "enrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "duration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9, + "error": null + }, + { + "query_index": 144, + "database_schema_index": 2, + "natural_language_query": "Find courses related to \"machine learning\" in courseDescription that are currently enrolling, count the number of unique courses titles, and group the results by courseDuration.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses related to \"machine learning\" in courseDescription that are currently enrolling, count the number of unique courses titles, and group the results by courseDuration.", + "target_collection": "Courses", + "search_query": "Find courses related to \"machine learning\" in courseDescription", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 145, + "database_schema_index": 2, + "natural_language_query": "Find courses that are related to data science in courseDescription, are currently enrolling as indicated by currentlyEnrolling being true, and return the top 5 most popular course titles using courseTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are related to data science in courseDescription, are currently enrolling as indicated by currentlyEnrolling being true, and return the top 5 most popular course titles using courseTitle.", + "target_collection": "Courses", + "search_query": "Data Science", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are related to data science in courseDescription, are currently enrolling as indicated by currentlyEnrolling being true, and return the top 5 most popular course titles using courseTitle.", + "target_collection": "Courses", + "search_query": "data science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 146, + "database_schema_index": 2, + "natural_language_query": "What are the currently enrolling courses related to 'machine learning applied techniques', and how is the enrollment status distributed across these courses by course title?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What are the currently enrolling courses related to 'machine learning applied techniques', and how is the enrollment status distributed across these courses by course title?", + "target_collection": "Courses", + "search_query": "Find courses related to 'machine learning applied techniques' in courseDescription", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the currently enrolling courses related to 'machine learning applied techniques', and how is the enrollment status distributed across these courses by course title?", + "target_collection": "Courses", + "search_query": "machine learning applied techniques", + "limit": 5, + "integer_property_filter": { + "property_name": "enrollment", + "operator": ">", + "value": 0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 147, + "database_schema_index": 2, + "natural_language_query": "Find courses by topics related to artificial intelligence, filter to only include those that are currently open for enrollment, and calculate the percentage of total courses that are currently enrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses by topics related to artificial intelligence, filter to only include those that are currently open for enrollment, and calculate the percentage of total courses that are currently enrolling.", + "target_collection": "Courses", + "search_query": "Find courses by topics related to artificial intelligence", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses by topics related to artificial intelligence, filter to only include those that are currently open for enrollment, and calculate the percentage of total courses that are currently enrolling.", + "target_collection": "Courses", + "search_query": "topics related to artificial intelligence", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9, + "error": null + }, + { + "query_index": 148, + "database_schema_index": 2, + "natural_language_query": "Find courses related to data science that are currently enrolling, and group these courses by their courseDuration to see how they vary by length.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses related to data science that are currently enrolling, and group these courses by their courseDuration to see how they vary by length.", + "target_collection": "Courses", + "search_query": "Find courses with subjects related to 'data science'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses related to data science that are currently enrolling, and group these courses by their courseDuration to see how they vary by length.", + "target_collection": "Courses", + "search_query": "courses related to data science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "enrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 149, + "database_schema_index": 2, + "natural_language_query": "Find courses with topics related to 'machine learning techniques' that are currently enrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses with topics related to 'machine learning techniques' that are currently enrolling.", + "target_collection": "Courses", + "search_query": "Find courses with topics related to 'machine learning techniques'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "3 validation errors for IntPropertyFilter\nproperty_name\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\noperator\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\nvalue\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing" + }, + { + "query_index": 150, + "database_schema_index": 2, + "natural_language_query": "What is the average course duration of courses related to 'machine learning fundamentals', and how does it vary between courses that are currently enrolling and those that are not?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average course duration of courses related to 'machine learning fundamentals', and how does it vary between courses that are currently enrolling and those that are not?", + "target_collection": "Courses", + "search_query": "Find courses that match the phrase 'machine learning fundamentals'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average course duration of courses related to 'machine learning fundamentals', and how does it vary between courses that are currently enrolling and those that are not?", + "target_collection": "Courses", + "search_query": "machine learning fundamentals", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "enrollingNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "enrollingNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 151, + "database_schema_index": 2, + "natural_language_query": "Find courses that are conceptually similar to 'data science' and calculate the average course duration in courseDuration.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are conceptually similar to 'data science' and calculate the average course duration in courseDuration.", + "target_collection": "Courses", + "search_query": "Find courses that best match the concept of 'data science'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are conceptually similar to 'data science' and calculate the average course duration in courseDuration.", + "target_collection": "Courses", + "search_query": "data science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 152, + "database_schema_index": 2, + "natural_language_query": "Find students who have research interests similar to quantum computing and determine the count of unique research interests, while grouping the results by whether they are enrolled full-time.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find students who have research interests similar to quantum computing and determine the count of unique research interests, while grouping the results by whether they are enrolled full-time.", + "target_collection": "Students", + "search_query": "quantum computing", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 153, + "database_schema_index": 2, + "natural_language_query": "Find courses that are conceptually similar to 'machine learning', are currently enrolling, and identify the top 3 most common course titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are conceptually similar to 'machine learning', are currently enrolling, and identify the top 3 most common course titles.", + "target_collection": "Courses", + "search_query": "Find courses related to 'machine learning' that are open for enrollment", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are conceptually similar to 'machine learning', are currently enrolling, and identify the top 3 most common course titles.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "enrollmentCount", + "metrics": "SUM" + }, + "text_property_aggregation": { + "property_name": "title", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.925, + "error": null + }, + { + "query_index": 154, + "database_schema_index": 2, + "natural_language_query": "Find the most relevant students based on research interests around 'machine learning', calculate the percentage of those students enrolled full-time, and group the results by their research interests.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find the most relevant students based on research interests around 'machine learning', calculate the percentage of those students enrolled full-time, and group the results by their research interests.", + "target_collection": "Students", + "search_query": "Find the most relevant students based on research interests around 'machine learning'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "enrolledFullTime", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "researchInterests" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='PERCENTAGE_TRUE', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 155, + "database_schema_index": 2, + "natural_language_query": "Find the number of courses with courseTitle or courseDescription related to 'Data Science', and summarize how many of these courses are currently open for enrollment.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find the number of courses with courseTitle or courseDescription related to 'Data Science', and summarize how many of these courses are currently open for enrollment.", + "target_collection": "Courses", + "search_query": "Data Science", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the number of courses with courseTitle or courseDescription related to 'Data Science', and summarize how many of these courses are currently open for enrollment.", + "target_collection": "Courses", + "search_query": "Data Science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "total_count", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 156, + "database_schema_index": 2, + "natural_language_query": "Find courses whose courseDescription is similar to 'machine learning foundations' and group these courses by their currentlyEnrolling status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses whose courseDescription is similar to 'machine learning foundations' and group these courses by their currentlyEnrolling status.", + "target_collection": "Courses", + "search_query": "Find courses whose courseDescription is similar to 'machine learning foundations'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses whose courseDescription is similar to 'machine learning foundations' and group these courses by their currentlyEnrolling status.", + "target_collection": "Courses", + "search_query": "machine learning foundations", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "total_enrolled", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 157, + "database_schema_index": 2, + "natural_language_query": "Find courses with a courseDescription that covers the entire data science lifecycle, including data collection, processing, analysis, and presentation.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses with a courseDescription that covers the entire data science lifecycle, including data collection, processing, analysis, and presentation.", + "target_collection": "Courses", + "search_query": "Find courses that cover the entire data science lifecycle, including data collection, processing, analysis, and presentation.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "2 validation errors for IntAggregation\nproperty_name\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\nmetrics\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing" + }, + { + "query_index": 158, + "database_schema_index": 2, + "natural_language_query": "Count the number of instructors grouped by tenured status who have at least 10 years in yearsOfTeaching.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Count the number of instructors grouped by tenured status who have at least 10 years in yearsOfTeaching.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "Count the number of instructors grouped by tenured status who have at least 10 years in yearsOfTeaching.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "tenured", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "tenured", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 159, + "database_schema_index": 2, + "natural_language_query": "Find the total number of instructors who have been teaching for at least 10 years based on their yearsOfTeaching.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find the total number of instructors who have been teaching for at least 10 years based on their yearsOfTeaching.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the total number of instructors who have been teaching for at least 10 years based on their yearsOfTeaching.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfTeaching", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 160, + "database_schema_index": 2, + "natural_language_query": "Identify instructors who have been teaching for at least 10 years. For these instructors, summarize how frequently different words appear in their biography, and categorize them based on whether they hold tenured positions.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify instructors who have been teaching for at least 10 years. For these instructors, summarize how frequently different words appear in their biography, and categorize them based on whether they hold tenured positions.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify instructors who have been teaching for at least 10 years. For these instructors, summarize how frequently different words appear in their biography, and categorize them based on whether they hold tenured positions.", + "target_collection": "Instructors", + "search_query": "instructors who have been teaching for at least 10 years", + "limit": 5, + "integer_property_filter": { + "property_name": "yearsTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "biography", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": { + "property_name": "tenured", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "tenured", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 161, + "database_schema_index": 2, + "natural_language_query": "Find instructors who have at least 10 yearsOfTeaching and determine the top 5 most common attributes mentioned in their biography.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find instructors who have at least 10 yearsOfTeaching and determine the top 5 most common attributes mentioned in their biography.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "biography", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find instructors who have at least 10 yearsOfTeaching and determine the top 5 most common attributes mentioned in their biography.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "biography", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 162, + "database_schema_index": 2, + "natural_language_query": "Find all instructors with more than 5 years in yearsOfTeaching, show the count of tenured status and group the results by instructorName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find all instructors with more than 5 years in yearsOfTeaching, show the count of tenured status and group the results by instructorName.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "instructorName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all instructors with more than 5 years in yearsOfTeaching, show the count of tenured status and group the results by instructorName.", + "target_collection": "Instructors", + "search_query": "instructors with more than 5 years in yearsOfTeaching", + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "tenuredStatus", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "instructorName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 163, + "database_schema_index": 2, + "natural_language_query": "Find courses with a courseDuration of at least 20 hours and determine how many of these are currently enrolling by counting the boolean currentlyEnrolling field.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses with a courseDuration of at least 20 hours and determine how many of these are currently enrolling by counting the boolean currentlyEnrolling field.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses with a courseDuration of at least 20 hours and determine how many of these are currently enrolling by counting the boolean currentlyEnrolling field.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 164, + "database_schema_index": 2, + "natural_language_query": "Identify instructors who have more than 10 years of teaching experience and group them by whether they hold a tenured position.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify instructors who have more than 10 years of teaching experience and group them by whether they hold a tenured position.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify instructors who have more than 10 years of teaching experience and group them by whether they hold a tenured position.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "teachingExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "tenuredPosition", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "tenuredPosition", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 165, + "database_schema_index": 2, + "natural_language_query": "Find courses that have a courseDuration greater than 10 hours.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that have a courseDuration greater than 10 hours.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that have a courseDuration greater than 10 hours.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 166, + "database_schema_index": 2, + "natural_language_query": "Find all courses containing 'machine learning' in the courseDescription, then group them by currentlyEnrolling status and determine the maximum courseDuration in each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find all courses containing 'machine learning' in the courseDescription, then group them by currentlyEnrolling status and determine the maximum courseDuration in each group.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "machine learning" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all courses containing 'machine learning' in the courseDescription, then group them by currentlyEnrolling status and determine the maximum courseDuration in each group.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 167, + "database_schema_index": 2, + "natural_language_query": "Find the average courseDuration of all courses that have 'Python' in their courseDescription.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find the average courseDuration of all courses that have 'Python' in their courseDescription.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "Python" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the average courseDuration of all courses that have 'Python' in their courseDescription.", + "target_collection": "Courses", + "search_query": "Python", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 168, + "database_schema_index": 2, + "natural_language_query": "Identify whether courses that mention 'machine learning' in their courseDescription are currently enrolling, group these courses by their currentlyEnrolling status, and list the top 5 most common courseTitles for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify whether courses that mention 'machine learning' in their courseDescription are currently enrolling, group these courses by their currentlyEnrolling status, and list the top 5 most common courseTitles for each group.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "machine learning" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify whether courses that mention 'machine learning' in their courseDescription are currently enrolling, group these courses by their currentlyEnrolling status, and list the top 5 most common courseTitles for each group.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 169, + "database_schema_index": 2, + "natural_language_query": "Find and count courses with 'data science' in the courseDescription by using the courseDescription text_property_filter with LIKE, and count the total number of different course titles using courseTitle text_property_aggregation COUNT.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find and count courses with 'data science' in the courseDescription by using the courseDescription text_property_filter with LIKE, and count the total number of different course titles using courseTitle text_property_aggregation COUNT.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "data science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find and count courses with 'data science' in the courseDescription by using the courseDescription text_property_filter with LIKE, and count the total number of different course titles using courseTitle text_property_aggregation COUNT.", + "target_collection": "Courses", + "search_query": "data science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseTitle", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 170, + "database_schema_index": 2, + "natural_language_query": "Identify all courses that include 'Data Science' in their courseTitle, count how many of these courses are currentlyEnrolling, and group the results by courseDuration to show how courses of different durations are distributed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify all courses that include 'Data Science' in their courseTitle, count how many of these courses are currentlyEnrolling, and group the results by courseDuration to show how courses of different durations are distributed.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Data Science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify all courses that include 'Data Science' in their courseTitle, count how many of these courses are currentlyEnrolling, and group the results by courseDuration to show how courses of different durations are distributed.", + "target_collection": "Courses", + "search_query": "Data Science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 171, + "database_schema_index": 2, + "natural_language_query": "Find courses where the courseTitle contains 'Advanced' and calculate the percentage of these that are currentlyEnrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses where the courseTitle contains 'Advanced' and calculate the percentage of these that are currentlyEnrolling.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Advanced" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses where the courseTitle contains 'Advanced' and calculate the percentage of these that are currentlyEnrolling.", + "target_collection": "Courses", + "search_query": "Advanced", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 172, + "database_schema_index": 2, + "natural_language_query": "Find courses containing 'Introduction to Data Science' in the courseTitle, and group the results by currentlyEnrolling status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses containing 'Introduction to Data Science' in the courseTitle, and group the results by currentlyEnrolling status.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Introduction to Data Science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses containing 'Introduction to Data Science' in the courseTitle, and group the results by currentlyEnrolling status.", + "target_collection": "Courses", + "search_query": "Introduction to Data Science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 173, + "database_schema_index": 2, + "natural_language_query": "Find courses where the courseDescription includes the phrase 'machine learning'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses where the courseDescription includes the phrase 'machine learning'.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "machine learning" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "3 validation errors for IntPropertyFilter\nproperty_name\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\noperator\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\nvalue\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing" + }, + { + "query_index": 174, + "database_schema_index": 2, + "natural_language_query": "Find courses that are currently enrolling and group them by courseTitle, calculating the total sum of courseDuration for each courseTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are currently enrolling and group them by courseTitle, calculating the total sum of courseDuration for each courseTitle.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are currently enrolling and group them by courseTitle, calculating the total sum of courseDuration for each courseTitle.", + "target_collection": "Courses", + "search_query": "courses that are currently enrolling", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "enrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 175, + "database_schema_index": 2, + "natural_language_query": "What is the total number of hours required to complete all courses that are currently open for enrollment?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the total number of hours required to complete all courses that are currently open for enrollment?", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the total number of hours required to complete all courses that are currently open for enrollment?", + "target_collection": "Courses", + "search_query": "courses that are currently open for enrollment", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "totalHours", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.75, + "error": null + }, + { + "query_index": 176, + "database_schema_index": 2, + "natural_language_query": "Identify courses that are currently open for enrollment (using currentlyEnrolling = true), and group them by courseDuration while aggregating the top 5 most common courseTitle values.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify courses that are currently open for enrollment (using currentlyEnrolling = true), and group them by courseDuration while aggregating the top 5 most common courseTitle values.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify courses that are currently open for enrollment (using currentlyEnrolling = true), and group them by courseDuration while aggregating the top 5 most common courseTitle values.", + "target_collection": "Courses", + "search_query": "courses currently open for enrollment", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 177, + "database_schema_index": 2, + "natural_language_query": "Retrieve courses that are currentlyEnrolling and count the number of unique courseTitle entries to understand how many different courses are currently open for enrollment.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Retrieve courses that are currentlyEnrolling and count the number of unique courseTitle entries to understand how many different courses are currently open for enrollment.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 178, + "database_schema_index": 2, + "natural_language_query": "Find courses where currentlyEnrolling is true, calculate the percentage of such courses, and group the results by courseTitle to see enrollment status per course.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses where currentlyEnrolling is true, calculate the percentage of such courses, and group the results by courseTitle to see enrollment status per course.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses where currentlyEnrolling is true, calculate the percentage of such courses, and group the results by courseTitle to see enrollment status per course.", + "target_collection": "Courses", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 179, + "database_schema_index": 2, + "natural_language_query": "Find all courses that are currently open for enrollment and calculate the total number of courses where the currentlyEnrolling property is true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find all courses that are currently open for enrollment and calculate the total number of courses where the currentlyEnrolling property is true.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all courses that are currently open for enrollment and calculate the total number of courses where the currentlyEnrolling property is true.", + "target_collection": "Courses", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 180, + "database_schema_index": 2, + "natural_language_query": "Find all course titles where courses are currently enrolling and group the results by course title.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find all course titles where courses are currently enrolling and group the results by course title.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all course titles where courses are currently enrolling and group the results by course title.", + "target_collection": "Courses", + "search_query": "course titles where courses are currently enrolling", + "limit": 5, + "integer_property_filter": { + "property_name": "enrollmentCount", + "operator": ">", + "value": 0 + }, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 181, + "database_schema_index": 2, + "natural_language_query": "Find courses where currentlyEnrolling is true", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses where currentlyEnrolling is true", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses where currentlyEnrolling is true", + "target_collection": "Courses", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 182, + "database_schema_index": 2, + "natural_language_query": "What is the average yearsOfTeaching of instructors, grouped by their tenured status?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average yearsOfTeaching of instructors, grouped by their tenured status?", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfTeaching", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average yearsOfTeaching of instructors, grouped by their tenured status?", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfTeaching", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenuredStatus", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 183, + "database_schema_index": 2, + "natural_language_query": "What is the average and maximum number of years instructors have been teaching in the yearsOfTeaching property of the Instructors collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average and maximum number of years instructors have been teaching in the yearsOfTeaching property of the Instructors collection?", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfTeaching", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "src.models.IntAggregation() argument after ** must be a mapping, not list" + }, + { + "query_index": 184, + "database_schema_index": 2, + "natural_language_query": "What is the count of each unique courseTitle for Courses, grouped by their currentlyEnrolling status?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the count of each unique courseTitle for Courses, grouped by their currentlyEnrolling status?", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the count of each unique courseTitle for Courses, grouped by their currentlyEnrolling status?", + "target_collection": "Courses", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 185, + "database_schema_index": 2, + "natural_language_query": "Count unique courseTitle values and find the top 5 most common course titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Count unique courseTitle values and find the top 5 most common course titles.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 186, + "database_schema_index": 2, + "natural_language_query": "What percentage of courses are currently open for enrollment and how are these courses grouped by course duration?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What percentage of courses are currently open for enrollment and how are these courses grouped by course duration?", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "What percentage of courses are currently open for enrollment and how are these courses grouped by course duration?", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "duration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 187, + "database_schema_index": 2, + "natural_language_query": "Calculate how many courses in the Courses collection are currently open for enrollment, and determine the percentage of courses that are currently enrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Calculate how many courses in the Courses collection are currently open for enrollment, and determine the percentage of courses that are currently enrolling.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate how many courses in the Courses collection are currently open for enrollment, and determine the percentage of courses that are currently enrolling.", + "target_collection": "Courses", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 188, + "database_schema_index": 2, + "natural_language_query": "What is the average years of teaching for instructors grouped by their tenured status using groupby on tenured?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average years of teaching for instructors grouped by their tenured status using groupby on tenured?", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average years of teaching for instructors grouped by their tenured status using groupby on tenured?", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfTeaching", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 189, + "database_schema_index": 2, + "natural_language_query": "What is the average packagePrice of travel packages whose packageDetails correspond to 'tropical beach relaxation' and have a price less than $1500, grouped by whether a discount is available?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the average packagePrice of travel packages whose packageDetails correspond to 'tropical beach relaxation' and have a price less than $1500, grouped by whether a discount is available?", + "target_collection": "TravelPackages", + "search_query": "Find travel packages whose packageDetails match 'tropical beach relaxation'", + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average packagePrice of travel packages whose packageDetails correspond to 'tropical beach relaxation' and have a price less than $1500, grouped by whether a discount is available?", + "target_collection": "TravelPackages", + "search_query": "tropical beach relaxation", + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 190, + "database_schema_index": 2, + "natural_language_query": "Find travel destinations that are related to exotic beaches and vibrant nightlife but have an averageVisitCost of no more than $1500. Additionally, determine the maximum averageVisitCost among destinations that are popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are related to exotic beaches and vibrant nightlife but have an averageVisitCost of no more than $1500. Additionally, determine the maximum averageVisitCost among destinations that are popular.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations related to exotic beaches and vibrant nightlife from destinationDescription", + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are related to exotic beaches and vibrant nightlife but have an averageVisitCost of no more than $1500. Additionally, determine the maximum averageVisitCost among destinations that are popular.", + "target_collection": "TravelDestinations", + "search_query": "exotic beaches and vibrant nightlife", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 191, + "database_schema_index": 2, + "natural_language_query": "Find destinations where the description includes 'hot and sunny beaches with vibrant nightlife', the averageVisitCost is less than or equal to 1500, count how many destinations are popular, and group the results by destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations where the description includes 'hot and sunny beaches with vibrant nightlife', the averageVisitCost is less than or equal to 1500, count how many destinations are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "hot and sunny beaches with vibrant nightlife", + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find destinations where the description includes 'hot and sunny beaches with vibrant nightlife', the averageVisitCost is less than or equal to 1500, count how many destinations are popular, and group the results by destinationName.", + "target_collection": "Destinations", + "search_query": "hot and sunny beaches with vibrant nightlife", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 192, + "database_schema_index": 3, + "natural_language_query": "Find travel packages that include safaris and beaches with a packagePrice less than 1000. Also, count how many times each packageName appears in the results.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages that include safaris and beaches with a packagePrice less than 1000. Also, count how many times each packageName appears in the results.", + "target_collection": "TravelPackages", + "search_query": "Find travel packages that include safaris and beaches", + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<", + "value": 1000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages that include safaris and beaches with a packagePrice less than 1000. Also, count how many times each packageName appears in the results.", + "target_collection": "TravelPackages", + "search_query": "safaris and beaches", + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<", + "value": 1000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "packageName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 193, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that offer peaceful beach vacations, where the averageVisitCost is less than or equal to 1500, count how many of these are popular, and group the results by destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that offer peaceful beach vacations, where the averageVisitCost is less than or equal to 1500, count how many of these are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations that offer peaceful beach vacations", + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that offer peaceful beach vacations, where the averageVisitCost is less than or equal to 1500, count how many of these are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "peaceful beach vacations", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 194, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations with beautiful beaches and rich cultural experiences where the averageVisitCost is no more than 1500, and determine what percentage of these destinations are currently popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations with beautiful beaches and rich cultural experiences where the averageVisitCost is no more than 1500, and determine what percentage of these destinations are currently popular.", + "target_collection": "TravelDestinations", + "search_query": "I want to find travel destinations with beautiful beaches and rich cultural experiences.", + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations with beautiful beaches and rich cultural experiences where the averageVisitCost is no more than 1500, and determine what percentage of these destinations are currently popular.", + "target_collection": "TravelDestinations", + "search_query": "beautiful beaches and rich cultural experiences", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 195, + "database_schema_index": 3, + "natural_language_query": "Search for a relaxing vacation package that includes beach activities and cultural tours, filter for packages with a packagePrice greater than 2000, and organize the results based on whether a discount is available, using discountAvailable as the grouping property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Search for a relaxing vacation package that includes beach activities and cultural tours, filter for packages with a packagePrice greater than 2000, and organize the results based on whether a discount is available, using discountAvailable as the grouping property.", + "target_collection": "TravelPackages", + "search_query": "A relaxing vacation package with beach activities and cultural tours", + "integer_property_filter": { + "property_name": "packagePrice", + "operator": ">", + "value": 2000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for a relaxing vacation package that includes beach activities and cultural tours, filter for packages with a packagePrice greater than 2000, and organize the results based on whether a discount is available, using discountAvailable as the grouping property.", + "target_collection": "VacationPackages", + "search_query": "relaxing vacation package beach activities cultural tours", + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": ">", + "value": 2000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 196, + "database_schema_index": 3, + "natural_language_query": "Find travel packages described as a 'relaxing beach holiday' with a packagePrice of at most $500.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages described as a 'relaxing beach holiday' with a packagePrice of at most $500.", + "target_collection": "TravelPackages", + "search_query": "Find travel packages described as a 'relaxing beach holiday'.", + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<=", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages described as a 'relaxing beach holiday' with a packagePrice of at most $500.", + "target_collection": "TravelPackages", + "search_query": "relaxing beach holiday", + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<=", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destination", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 197, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations with descriptions similar to 'beach and cultural experiences', filter for destinations named Bali, calculate the average of averageVisitCost, and group by whether destinations are popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations with descriptions similar to 'beach and cultural experiences', filter for destinations named Bali, calculate the average of averageVisitCost, and group by whether destinations are popular.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations with descriptions similar to 'beach and cultural experiences'", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "=", + "value": "Bali" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations with descriptions similar to 'beach and cultural experiences', filter for destinations named Bali, calculate the average of averageVisitCost, and group by whether destinations are popular.", + "target_collection": "TravelDestinations", + "search_query": "beach and cultural experiences", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Bali" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "popular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 198, + "database_schema_index": 3, + "natural_language_query": "Find destinations whose descriptions semantically emphasize beautiful landscapes, specifically retrieve destinations named \"Bora Bora\", and determine the maximum average visit cost among all destinations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations whose descriptions semantically emphasize beautiful landscapes, specifically retrieve destinations named \"Bora Bora\", and determine the maximum average visit cost among all destinations.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations with descriptions that emphasize beautiful landscapes", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "=", + "value": "Bora Bora" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find destinations whose descriptions semantically emphasize beautiful landscapes, specifically retrieve destinations named \"Bora Bora\", and determine the maximum average visit cost among all destinations.", + "target_collection": "Destinations", + "search_query": "beautiful landscapes", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Bora Bora" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 199, + "database_schema_index": 3, + "natural_language_query": "Find the most frequently occurring travel destinations that are popular among tourists, and match the phrase 'tropical beaches with vibrant nightlife', grouping them by their names and aggregating the count of each destination name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find the most frequently occurring travel destinations that are popular among tourists, and match the phrase 'tropical beaches with vibrant nightlife', grouping them by their names and aggregating the count of each destination name.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match the phrase 'tropical beaches with vibrant nightlife'", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "popular", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the most frequently occurring travel destinations that are popular among tourists, and match the phrase 'tropical beaches with vibrant nightlife', grouping them by their names and aggregating the count of each destination name.", + "target_collection": "TravelDestinations", + "search_query": "tropical beaches with vibrant nightlife", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 200, + "database_schema_index": 3, + "natural_language_query": "Find destinations with tropical experiences as described in the destinationDescription, locate destinations that have 'Beach' included in the destinationName, and count how many destinations are currently marked as popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations with tropical experiences as described in the destinationDescription, locate destinations that have 'Beach' included in the destinationName, and count how many destinations are currently marked as popular.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations with tropical experiences in destinationDescription", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "Beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find destinations with tropical experiences as described in the destinationDescription, locate destinations that have 'Beach' included in the destinationName, and count how many destinations are currently marked as popular.", + "target_collection": "Destinations", + "search_query": "tropical experiences", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "Beach" + }, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 201, + "database_schema_index": 3, + "natural_language_query": "Find destinations with a description similar to 'scenic views', filter those with 'island' in their destinationName, group results by destinationName, and calculate the percentage of popular destinations within each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations with a description similar to 'scenic views', filter those with 'island' in their destinationName, group results by destinationName, and calculate the percentage of popular destinations within each group.", + "target_collection": "TravelDestinations", + "search_query": "scenic views", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "%island%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find destinations with a description similar to 'scenic views', filter those with 'island' in their destinationName, group results by destinationName, and calculate the percentage of popular destinations within each group.", + "target_collection": "Destinations", + "search_query": "scenic views", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "island" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 202, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that are relevant to a charming winter holiday experience with various activities. Additionally, filter results to include only destinations named 'Swiss Alps', and count how many of these destinations are currently popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are relevant to a charming winter holiday experience with various activities. Additionally, filter results to include only destinations named 'Swiss Alps', and count how many of these destinations are currently popular.", + "target_collection": "TravelDestinations", + "search_query": "I am looking for a charming winter holiday experience with various activities.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "=", + "value": "Swiss Alps" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are relevant to a charming winter holiday experience with various activities. Additionally, filter results to include only destinations named 'Swiss Alps', and count how many of these destinations are currently popular.", + "target_collection": "TravelDestinations", + "search_query": "charming winter holiday experience", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Swiss Alps" + }, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.925, + "error": null + }, + { + "query_index": 203, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that offer a cultural experience in their description, include 'Paris' in the destination name, and group the results by whether they are currently popular among tourists.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that offer a cultural experience in their description, include 'Paris' in the destination name, and group the results by whether they are currently popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": "A cultural experience", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "%Paris%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that offer a cultural experience in their description, include 'Paris' in the destination name, and group the results by whether they are currently popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": "cultural experience", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "Paris" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popularAmongTourists", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 204, + "database_schema_index": 3, + "natural_language_query": "Find travel packages that are conceptually similar to a relaxing beach vacation and have 'Caribbean' in the packageName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages that are conceptually similar to a relaxing beach vacation and have 'Caribbean' in the packageName.", + "target_collection": "TravelPackages", + "search_query": "relaxing beach vacation", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "packageName", + "operator": "LIKE", + "value": "Caribbean" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages that are conceptually similar to a relaxing beach vacation and have 'Caribbean' in the packageName.", + "target_collection": "TravelPackages", + "search_query": "relaxing beach vacation", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "packageName", + "operator": "LIKE", + "value": "Caribbean" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 205, + "database_schema_index": 3, + "natural_language_query": "Search for travel destinations with scenic beaches and vibrant local culture, filter for those that are currently popular, calculate the average cost to visit, and group by destination name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Search for travel destinations with scenic beaches and vibrant local culture, filter for those that are currently popular, calculate the average cost to visit, and group by destination name.", + "target_collection": "TravelDestinations", + "search_query": "Scenic beaches with vibrant local culture", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for travel destinations with scenic beaches and vibrant local culture, filter for those that are currently popular, calculate the average cost to visit, and group by destination name.", + "target_collection": "TravelDestinations", + "search_query": "scenic beaches and vibrant local culture", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 206, + "database_schema_index": 3, + "natural_language_query": "Identify popular travel destinations described as tropical beaches and places with rich cultural history, and compute the average cost of visiting these popular locations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Identify popular travel destinations described as tropical beaches and places with rich cultural history, and compute the average cost of visiting these popular locations.", + "target_collection": "TravelDestinations", + "search_query": "Find tropical beaches and cultural destinations with rich histories.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify popular travel destinations described as tropical beaches and places with rich cultural history, and compute the average cost of visiting these popular locations.", + "target_collection": "TravelDestinations", + "search_query": "tropical beaches and places with rich cultural history", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 207, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations related to beach vacations that are popular, categorize them by destinationName, and identify the top 5 most common destination names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations related to beach vacations that are popular, categorize them by destinationName, and identify the top 5 most common destination names.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations related to beach vacations", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations related to beach vacations that are popular, categorize them by destinationName, and identify the top 5 most common destination names.", + "target_collection": "TravelDestinations", + "search_query": "beach vacations", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "popularity", + "metrics": "MEAN" + }, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 208, + "database_schema_index": 3, + "natural_language_query": "Find the most relevant travel destinations with scenic beaches and vibrant nightlife among those that are currently popular, and count how many travel destinations are there.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find the most relevant travel destinations with scenic beaches and vibrant nightlife among those that are currently popular, and count how many travel destinations are there.", + "target_collection": "TravelDestinations", + "search_query": "description: 'Describe destinations with scenic beaches and vibrant nightlife'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the most relevant travel destinations with scenic beaches and vibrant nightlife among those that are currently popular, and count how many travel destinations are there.", + "target_collection": "TravelDestinations", + "search_query": "scenic beaches and vibrant nightlife", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isPopular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "id", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 209, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that match 'tropical beaches with vibrant cultures' in their destinationDescription, filter them to show only those that are currently popular, calculate the percentage of destinations that are popular, and group the results by destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that match 'tropical beaches with vibrant cultures' in their destinationDescription, filter them to show only those that are currently popular, calculate the percentage of destinations that are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match 'tropical beaches with vibrant cultures' in destinationDescription", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that match 'tropical beaches with vibrant cultures' in their destinationDescription, filter them to show only those that are currently popular, calculate the percentage of destinations that are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "tropical beaches with vibrant cultures", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 210, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations with sunny beaches and vibrant nightlife, filter for where they are currently popular, and count these popular destinations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations with sunny beaches and vibrant nightlife, filter for where they are currently popular, and count these popular destinations.", + "target_collection": "TravelDestinations", + "search_query": "sunny beaches and vibrant nightlife", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations with sunny beaches and vibrant nightlife, filter for where they are currently popular, and count these popular destinations.", + "target_collection": "TravelDestinations", + "search_query": "sunny beaches and vibrant nightlife", + "limit": 5, + "integer_property_filter": { + "property_name": "popularity", + "operator": ">", + "value": 0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "popularity", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPopular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 211, + "database_schema_index": 3, + "natural_language_query": "Find popular travel destinations with descriptions that include scenic vistas and vibrant cultures, and group these destinations by their destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find popular travel destinations with descriptions that include scenic vistas and vibrant cultures, and group these destinations by their destinationName.", + "target_collection": "TravelDestinations", + "search_query": "Explore scenic vistas and vibrant cultures", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find popular travel destinations with descriptions that include scenic vistas and vibrant cultures, and group these destinations by their destinationName.", + "target_collection": "TravelDestinations", + "search_query": "scenic vistas and vibrant cultures", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "popularity", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 212, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that are popular and include descriptions related to 'tropical beaches and adventure sports'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are popular and include descriptions related to 'tropical beaches and adventure sports'.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that include descriptions related to 'tropical beaches and adventure sports' within the destinationDescription.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are popular and include descriptions related to 'tropical beaches and adventure sports'.", + "target_collection": "TravelDestinations", + "search_query": "tropical beaches and adventure sports", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 213, + "database_schema_index": 3, + "natural_language_query": "Identify travel packages providing a relaxing beach holiday (using search_query on packageDetails). Within these, calculate the average packagePrice (using int_property_aggregation on packagePrice), and group the results by whether there is a discountAvailable (using groupby on discountAvailable).", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Identify travel packages providing a relaxing beach holiday (using search_query on packageDetails). Within these, calculate the average packagePrice (using int_property_aggregation on packagePrice), and group the results by whether there is a discountAvailable (using groupby on discountAvailable).", + "target_collection": "TravelPackages", + "search_query": "Find travel packages that offer a relaxing beach holiday", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify travel packages providing a relaxing beach holiday (using search_query on packageDetails). Within these, calculate the average packagePrice (using int_property_aggregation on packagePrice), and group the results by whether there is a discountAvailable (using groupby on discountAvailable).", + "target_collection": "TravelPackages", + "search_query": "relaxing beach holiday", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 214, + "database_schema_index": 3, + "natural_language_query": "What is the average cost of visiting tropical beach resorts described in detail?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the average cost of visiting tropical beach resorts described in detail?", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match the detailed description of tropical beach resorts.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average cost of visiting tropical beach resorts described in detail?", + "target_collection": "Resorts", + "search_query": "tropical beach resorts", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 215, + "database_schema_index": 3, + "natural_language_query": "List travel destinations matching a description of 'tropical beaches', count the different destination names, and group results by whether they are popular to see which group has more destinations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "List travel destinations matching a description of 'tropical beaches', count the different destination names, and group results by whether they are popular to see which group has more destinations.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that best match the description 'tropical beaches'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 216, + "database_schema_index": 3, + "natural_language_query": "Find destinations that are conceptually similar to 'romantic getaway with beach access', and also list the top 5 most common destination names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations that are conceptually similar to 'romantic getaway with beach access', and also list the top 5 most common destination names.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations that are conceptually similar to 'romantic getaway with beach access'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='TOP_OCCURRENCES', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 217, + "database_schema_index": 3, + "natural_language_query": "What percentage of destinations, grouped by destination names, are popular among tourists, and which of these have similar descriptions to 'romantic beaches with vibrant nightlife'? Please find matching entries using semantic search, and analyze the proportion of those considered popular using boolean property aggregation for the 'popular' field.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What percentage of destinations, grouped by destination names, are popular among tourists, and which of these have similar descriptions to 'romantic beaches with vibrant nightlife'? Please find matching entries using semantic search, and analyze the proportion of those considered popular using boolean property aggregation for the 'popular' field.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations similar to 'romantic beaches with vibrant nightlife.'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='PERCENTAGE_TRUE', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 218, + "database_schema_index": 3, + "natural_language_query": "What percentage of travel destinations, that match snowy mountains and vibrant city life descriptions, are currently popular among tourists?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What percentage of travel destinations, that match snowy mountains and vibrant city life descriptions, are currently popular among tourists?", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match descriptions of snowy mountains and vibrant city life.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What percentage of travel destinations, that match snowy mountains and vibrant city life descriptions, are currently popular among tourists?", + "target_collection": "TravelDestinations", + "search_query": "snowy mountains vibrant city life", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 219, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that match the theme 'tropical beach with vibrant nightlife', and group the results based on whether they are popular among tourists.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that match the theme 'tropical beach with vibrant nightlife', and group the results based on whether they are popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match the query \"tropical beach with vibrant nightlife\".", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that match the theme 'tropical beach with vibrant nightlife', and group the results based on whether they are popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": "tropical beach with vibrant nightlife", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "popularityRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popularAmongTourists", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "popularAmongTourists", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 220, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that are conceptually similar to 'romantic nature getaways' based on the destinationDescription.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are conceptually similar to 'romantic nature getaways' based on the destinationDescription.", + "target_collection": "TravelDestinations", + "search_query": "{\"destinationDescription\":{\"operator\":\"search_query\",\"value\":\"romantic nature getaways\"}}", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are conceptually similar to 'romantic nature getaways' based on the destinationDescription.", + "target_collection": "Destinations", + "search_query": "romantic nature getaways", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 221, + "database_schema_index": 3, + "natural_language_query": "Count how many travel agents have more than 5 years of experience, and group them by their agentName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Count how many travel agents have more than 5 years of experience, and group them by their agentName.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "agentName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Count how many travel agents have more than 5 years of experience, and group them by their agentName.", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "experienceYears", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "agentName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 222, + "database_schema_index": 3, + "natural_language_query": "Find travel agents who have at least 10 years in yearsOfExperience and determine the average years of experience among all travel agents.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel agents who have at least 10 years in yearsOfExperience and determine the average years of experience among all travel agents.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel agents who have at least 10 years in yearsOfExperience and determine the average years of experience among all travel agents.", + "target_collection": "TravelAgents", + "search_query": "travel agents", + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 223, + "database_schema_index": 3, + "natural_language_query": "Find travel agents who have at least 5 years in yearsOfExperience, count how many travel agents share the same agentName, and categorize the results based on whether they are availableNow.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel agents who have at least 5 years in yearsOfExperience, count how many travel agents share the same agentName, and categorize the results based on whether they are availableNow.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "availableNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel agents who have at least 5 years in yearsOfExperience, count how many travel agents share the same agentName, and categorize the results based on whether they are availableNow.", + "target_collection": "TravelAgents", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "agentName", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "availableNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "agentName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 224, + "database_schema_index": 3, + "natural_language_query": "Show all travel agents with at least 5 years of experience and count the number of unique agentName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Show all travel agents with at least 5 years of experience and count the number of unique agentName.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 225, + "database_schema_index": 3, + "natural_language_query": "Find travel packages that cost no more than 2000 in packagePrice, group these results by packageName, and count the total number of packages with discounts by evaluating discountAvailable.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages that cost no more than 2000 in packagePrice, group these results by packageName, and count the total number of packages with discounts by evaluating discountAvailable.", + "target_collection": "TravelPackages", + "search_query": null, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<=", + "value": 2000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "packageName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages that cost no more than 2000 in packagePrice, group these results by packageName, and count the total number of packages with discounts by evaluating discountAvailable.", + "target_collection": "TravelPackages", + "search_query": "travel packages", + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<=", + "value": 2000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "discountAvailable", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "packageName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 226, + "database_schema_index": 3, + "natural_language_query": "Find travel agents with at least 5 years of experience and count how many are available now.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel agents with at least 5 years of experience and count how many are available now.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel agents with at least 5 years of experience and count how many are available now.", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "availableNow", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "availableNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 227, + "database_schema_index": 3, + "natural_language_query": "Group travel agents by their yearsOfExperience and only include those that have more than 5 years in yearsOfExperience.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Group travel agents by their yearsOfExperience and only include those that have more than 5 years in yearsOfExperience.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "yearsOfExperience" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group travel agents by their yearsOfExperience and only include those that have more than 5 years in yearsOfExperience.", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "yearsOfExperience", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 228, + "database_schema_index": 3, + "natural_language_query": "Find travel agents with at least 5 years of experience in yearsOfExperience.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel agents with at least 5 years of experience in yearsOfExperience.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel agents with at least 5 years of experience in yearsOfExperience.", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 229, + "database_schema_index": 3, + "natural_language_query": "Find travel packages where the packageDetails include the keyword 'luxury', then compute the average of packagePrice for packages where discountAvailable is true, and group the results based on whether a discount is available.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages where the packageDetails include the keyword 'luxury', then compute the average of packagePrice for packages where discountAvailable is true, and group the results based on whether a discount is available.", + "target_collection": "TravelPackages", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "packageDetails", + "operator": "LIKE", + "value": "luxury" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages where the packageDetails include the keyword 'luxury', then compute the average of packagePrice for packages where discountAvailable is true, and group the results based on whether a discount is available.", + "target_collection": "TravelPackages", + "search_query": "luxury", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 230, + "database_schema_index": 3, + "natural_language_query": "Determine the average averageVisitCost for travel destinations where destinationDescription contains the keyword 'beach'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Determine the average averageVisitCost for travel destinations where destinationDescription contains the keyword 'beach'.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Determine the average averageVisitCost for travel destinations where destinationDescription contains the keyword 'beach'.", + "target_collection": "TravelDestinations", + "search_query": "beach", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 231, + "database_schema_index": 3, + "natural_language_query": "List all travel destinations where the destinationDescription mentions 'popular', count how many destinations have such a description, and group these results by destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "List all travel destinations where the destinationDescription mentions 'popular', count how many destinations have such a description, and group these results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "%popular%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 232, + "database_schema_index": 3, + "natural_language_query": "Find all destinations in TravelDestinations where the destinationDescription contains the word 'beach', and count how many such destinations exist.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find all destinations in TravelDestinations where the destinationDescription contains the word 'beach', and count how many such destinations exist.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "%beach%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 233, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations where the destinationDescription includes 'beach', group the results by destinationName and count how many of these destinations are popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations where the destinationDescription includes 'beach', group the results by destinationName and count how many of these destinations are popular.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations where the destinationDescription includes 'beach', group the results by destinationName and count how many of these destinations are popular.", + "target_collection": "TravelDestinations", + "search_query": "beach", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "popularity", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 234, + "database_schema_index": 3, + "natural_language_query": "Show me travel destinations that include 'Beach' in their destinationName and count how many of them are popular using the popular attribute.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Show me travel destinations that include 'Beach' in their destinationName and count how many of them are popular using the popular attribute.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "Beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Show me travel destinations that include 'Beach' in their destinationName and count how many of them are popular using the popular attribute.", + "target_collection": "TravelDestinations", + "search_query": "Beach", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "popular", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 235, + "database_schema_index": 3, + "natural_language_query": "Find all travel destinations where the destinationDescription contains the keyword 'beach', and group the results by whether or not the destination is popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find all travel destinations where the destinationDescription contains the keyword 'beach', and group the results by whether or not the destination is popular.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all travel destinations where the destinationDescription contains the keyword 'beach', and group the results by whether or not the destination is popular.", + "target_collection": "TravelDestinations", + "search_query": "beach", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "popular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 236, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations with descriptions that contain the keyword 'beaches' in destinationDescription.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations with descriptions that contain the keyword 'beaches' in destinationDescription.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "beaches" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "3 validation errors for IntPropertyFilter\nproperty_name\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\noperator\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\nvalue\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing" + }, + { + "query_index": 237, + "database_schema_index": 3, + "natural_language_query": "Find the average cost of all travel destinations that are popular, and group the results by each destination name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find the average cost of all travel destinations that are popular, and group the results by each destination name.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the average cost of all travel destinations that are popular, and group the results by each destination name.", + "target_collection": "TravelDestinations", + "search_query": "popular travel destinations", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "cost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 238, + "database_schema_index": 3, + "natural_language_query": "Find the total sum of packagePrice for all travel packages where discountAvailable is true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find the total sum of packagePrice for all travel packages where discountAvailable is true.", + "target_collection": "TravelPackages", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the total sum of packagePrice for all travel packages where discountAvailable is true.", + "target_collection": "TravelPackages", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 239, + "database_schema_index": 3, + "natural_language_query": "List and categorize all popular travel destinations by their names, and for each destination, count the number of detailed descriptions available, ensuring that only destinations currently popular among tourists are included.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "List and categorize all popular travel destinations by their names, and for each destination, count the number of detailed descriptions available, ensuring that only destinations currently popular among tourists are included.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "List and categorize all popular travel destinations by their names, and for each destination, count the number of detailed descriptions available, ensuring that only destinations currently popular among tourists are included.", + "target_collection": "TravelDestinations", + "search_query": "popular travel destinations", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isPopular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "detailedDescriptions", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 240, + "database_schema_index": 3, + "natural_language_query": "Retrieve destinations with destinationName that are currently popular, then count the number of unique destinationName values.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Retrieve destinations with destinationName that are currently popular, then count the number of unique destinationName values.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 241, + "database_schema_index": 3, + "natural_language_query": "Find me all travel packages where there is a discountAvailable, count how many packages have a discount and organize the results by packageName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find me all travel packages where there is a discountAvailable, count how many packages have a discount and organize the results by packageName.", + "target_collection": "TravelPackages", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "packageName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find me all travel packages where there is a discountAvailable, count how many packages have a discount and organize the results by packageName.", + "target_collection": "TravelPackages", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "discountAvailable", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "packageName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 242, + "database_schema_index": 3, + "natural_language_query": "Find all travel destinations where the destination is currently popular, and calculate the percentage of all travel destinations that are popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find all travel destinations where the destination is currently popular, and calculate the percentage of all travel destinations that are popular.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all travel destinations where the destination is currently popular, and calculate the percentage of all travel destinations that are popular.", + "target_collection": "TravelDestinations", + "search_query": "popular", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 243, + "database_schema_index": 3, + "natural_language_query": "Find popular travel destinations, where 'popular' equals true, and group results by 'destinationName'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find popular travel destinations, where 'popular' equals true, and group results by 'destinationName'.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find popular travel destinations, where 'popular' equals true, and group results by 'destinationName'.", + "target_collection": "TravelDestinations", + "search_query": "popular travel destinations", + "limit": 5, + "integer_property_filter": { + "property_name": "popular", + "operator": "=", + "value": 1 + }, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 244, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that are popular among tourists.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": "popular among tourists", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "popularity", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isPopular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 245, + "database_schema_index": 3, + "natural_language_query": "Count the number of travel agents grouped by their availability status, using the yearsOfExperience property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Count the number of travel agents grouped by their availability status, using the yearsOfExperience property.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "availableNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Count the number of travel agents grouped by their availability status, using the yearsOfExperience property.", + "target_collection": "TravelAgents", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "availabilityStatus", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 246, + "database_schema_index": 3, + "natural_language_query": "What is the average yearsOfExperience for all travel agents in the TravelAgents collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the average yearsOfExperience for all travel agents in the TravelAgents collection?", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average yearsOfExperience for all travel agents in the TravelAgents collection?", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 247, + "database_schema_index": 3, + "natural_language_query": "What is the count of each travel destination name grouped by whether the destination is popular?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the count of each travel destination name grouped by whether the destination is popular?", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the count of each travel destination name grouped by whether the destination is popular?", + "target_collection": "TravelDestinations", + "search_query": "travel destination name", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 248, + "database_schema_index": 3, + "natural_language_query": "What is the most common destination name in the Travel Destinations collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the most common destination name in the Travel Destinations collection?", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the most common destination name in the Travel Destinations collection?", + "target_collection": "Travel Destinations", + "search_query": "destination name", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 249, + "database_schema_index": 3, + "natural_language_query": "Show the percentage of popular destinations for each destinationName by grouping the destinations and calculating how many are marked as popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Show the percentage of popular destinations for each destinationName by grouping the destinations and calculating how many are marked as popular.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 250, + "database_schema_index": 3, + "natural_language_query": "Count how many travel destinations are currently popular and calculate the percentage of popular destinations in the TravelDestinations collection.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Count how many travel destinations are currently popular and calculate the percentage of popular destinations in the TravelDestinations collection.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 251, + "database_schema_index": 3, + "natural_language_query": "Group all travel destinations by the boolean property popular and determine the averageVisitCost for each group to understand the cost difference between popular and non-popular destinations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Group all travel destinations by the boolean property popular and determine the averageVisitCost for each group to understand the cost difference between popular and non-popular destinations.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group all travel destinations by the boolean property popular and determine the averageVisitCost for each group to understand the cost difference between popular and non-popular destinations.", + "target_collection": "TravelDestinations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "popular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 252, + "database_schema_index": 3, + "natural_language_query": "Explore art pieces of significant historical relevance, filter those with a currentValuation greater than 1,000,000, calculate the average currentValuation, and group the results by their onDisplay status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Explore art pieces of significant historical relevance, filter those with a currentValuation greater than 1,000,000, calculate the average currentValuation, and group the results by their onDisplay status.", + "target_collection": "ArtPieces", + "search_query": "Explore art pieces of significant historical relevance", + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "onDisplay" + }, + "predicted_query": { + "corresponding_natural_language_query": "Explore art pieces of significant historical relevance, filter those with a currentValuation greater than 1,000,000, calculate the average currentValuation, and group the results by their onDisplay status.", + "target_collection": "ArtPieces", + "search_query": "significant historical relevance", + "limit": 5, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "onDisplay", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 253, + "database_schema_index": 3, + "natural_language_query": "Find the average currentValuation of art pieces with significant historical details in their artPieceHistory where the currentValuation is greater than 1,000,000.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find the average currentValuation of art pieces with significant historical details in their artPieceHistory where the currentValuation is greater than 1,000,000.", + "target_collection": "ArtPieces", + "search_query": "Explore notable art pieces with historical significance described in their artPieceHistory", + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the average currentValuation of art pieces with significant historical details in their artPieceHistory where the currentValuation is greater than 1,000,000.", + "target_collection": "ArtPieces", + "search_query": "significant historical details in their artPieceHistory", + "limit": 5, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 254, + "database_schema_index": 3, + "natural_language_query": "Explore exhibitions that feature modern art and innovative installations, focusing only on those with an averageVisitorCount above 100, grouped by the exhibitionTitle to identify how many unique exhibitions match this criterion.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Explore exhibitions that feature modern art and innovative installations, focusing only on those with an averageVisitorCount above 100, grouped by the exhibitionTitle to identify how many unique exhibitions match this criterion.", + "target_collection": "Exhibitions", + "search_query": "modern art and innovative installations", + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Explore exhibitions that feature modern art and innovative installations, focusing only on those with an averageVisitorCount above 100, grouped by the exhibitionTitle to identify how many unique exhibitions match this criterion.", + "target_collection": "Exhibitions", + "search_query": "modern art innovative installations", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 255, + "database_schema_index": 3, + "natural_language_query": "Find exhibitions with descriptions about exploring the influence of Impressionism, where the averageVisitorCount is greater than 500, and count unique exhibition titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions with descriptions about exploring the influence of Impressionism, where the averageVisitorCount is greater than 500, and count unique exhibition titles.", + "target_collection": "Exhibitions", + "search_query": "exploring the influence of Impressionism", + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions with descriptions about exploring the influence of Impressionism, where the averageVisitorCount is greater than 500, and count unique exhibition titles.", + "target_collection": "Exhibitions", + "search_query": "exploring the influence of Impressionism", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "title", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 256, + "database_schema_index": 4, + "natural_language_query": "Find top museums highlighting Renaissance art, where entry fees are no more than 20, group results by exhibitHighlights, and determine how many are open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find top museums highlighting Renaissance art, where entry fees are no more than 20, group results by exhibitHighlights, and determine how many are open today.", + "target_collection": "Museums", + "search_query": "Top museums highlighting Renaissance art", + "integer_property_filter": { + "property_name": "entryFee", + "operator": "<=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitHighlights" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find top museums highlighting Renaissance art, where entry fees are no more than 20, group results by exhibitHighlights, and determine how many are open today.", + "target_collection": "Museums", + "search_query": "highlighting Renaissance art", + "limit": 5, + "integer_property_filter": { + "property_name": "entryFee", + "operator": "<=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "exhibitHighlights", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 257, + "database_schema_index": 4, + "natural_language_query": "List exhibitions with cultural themes in their exhibitionDescription that have an averageVisitorCount greater than 100, and summarize how many of these exhibitions are currentlyRunning.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "List exhibitions with cultural themes in their exhibitionDescription that have an averageVisitorCount greater than 100, and summarize how many of these exhibitions are currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": "cultural themes", + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "List exhibitions with cultural themes in their exhibitionDescription that have an averageVisitorCount greater than 100, and summarize how many of these exhibitions are currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": "cultural themes", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 258, + "database_schema_index": 4, + "natural_language_query": "Find museums where the exhibit highlights emphasize historical significance, filter for museums with entry fees exceeding 10, and group the results by each museum's name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where the exhibit highlights emphasize historical significance, filter for museums with entry fees exceeding 10, and group the results by each museum's name.", + "target_collection": "Museums", + "search_query": "exhibitHighlights", + "integer_property_filter": { + "property_name": "entryFee", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where the exhibit highlights emphasize historical significance, filter for museums with entry fees exceeding 10, and group the results by each museum's name.", + "target_collection": "Museums", + "search_query": "exhibit highlights emphasize historical significance", + "limit": 5, + "integer_property_filter": { + "property_name": "entryFees", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 259, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibitHighlights relevant to 'Impressionist art' that also have an entryFee greater than $10.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibitHighlights relevant to 'Impressionist art' that also have an entryFee greater than $10.", + "target_collection": "Museums", + "search_query": "Impressionist art", + "integer_property_filter": { + "property_name": "entryFee", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibitHighlights relevant to 'Impressionist art' that also have an entryFee greater than $10.", + "target_collection": "Museums", + "search_query": "exhibitHighlights relevant to 'Impressionist art'", + "limit": 5, + "integer_property_filter": { + "property_name": "entryFee", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "entryFee", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 260, + "database_schema_index": 4, + "natural_language_query": "Search for art pieces with significant historical relevance using their artPieceHistory, filter for those that have 'Monet' in artPieceName, calculate the average of currentValuation, and group the results by their onDisplay status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Search for art pieces with significant historical relevance using their artPieceHistory, filter for those that have 'Monet' in artPieceName, calculate the average of currentValuation, and group the results by their onDisplay status.", + "target_collection": "ArtPieces", + "search_query": "Find artworks with significant historical relevance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceName", + "operator": "LIKE", + "value": "%Monet%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "onDisplay" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for art pieces with significant historical relevance using their artPieceHistory, filter for those that have 'Monet' in artPieceName, calculate the average of currentValuation, and group the results by their onDisplay status.", + "target_collection": "ArtPieces", + "search_query": "art pieces with significant historical relevance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceName", + "operator": "LIKE", + "value": "Monet" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "onDisplay", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 261, + "database_schema_index": 4, + "natural_language_query": "Search for museums whose exhibitHighlights semantically match 'famous art exhibits with rich historical significance', where museumName is exactly 'Louvre', and compute the sum of entryFee.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Search for museums whose exhibitHighlights semantically match 'famous art exhibits with rich historical significance', where museumName is exactly 'Louvre', and compute the sum of entryFee.", + "target_collection": "Museums", + "search_query": "explore famous art exhibits with rich historical significance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "=", + "value": "Louvre" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for museums whose exhibitHighlights semantically match 'famous art exhibits with rich historical significance', where museumName is exactly 'Louvre', and compute the sum of entryFee.", + "target_collection": "Museums", + "search_query": "famous art exhibits with rich historical significance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "=", + "value": "Louvre" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 262, + "database_schema_index": 4, + "natural_language_query": "Retrieve museums with exhibit highlights similar to 'ancient artifacts', filter specifically on museums named 'Smithsonian', count the unique exhibit highlights available, and group the results by the museum name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Retrieve museums with exhibit highlights similar to 'ancient artifacts', filter specifically on museums named 'Smithsonian', count the unique exhibit highlights available, and group the results by the museum name.", + "target_collection": "Museums", + "search_query": "Find museums with exhibit highlights similar to 'ancient artifacts'.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "=", + "value": "Smithsonian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 263, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions that focus on impressionist themes, check if they are currently running, and count the total number of distinct exhibition titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions that focus on impressionist themes, check if they are currently running, and count the total number of distinct exhibition titles.", + "target_collection": "Exhibitions", + "search_query": "Explore exhibitions that focus on impressionist themes in exhibitionDescription", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 264, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibits highlighting the historical significance of Vincent van Gogh's pieces using semantic search, filter for museums whose names include 'National', aggregate by counting the number of museums open today, and group results by museumName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibits highlighting the historical significance of Vincent van Gogh's pieces using semantic search, filter for museums whose names include 'National', aggregate by counting the number of museums open today, and group results by museumName.", + "target_collection": "Museums", + "search_query": "historical significance of Vincent van Gogh's pieces", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "LIKE", + "value": "National" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibits highlighting the historical significance of Vincent van Gogh's pieces using semantic search, filter for museums whose names include 'National', aggregate by counting the number of museums open today, and group results by museumName.", + "target_collection": "Museums", + "search_query": "exhibits highlighting the historical significance of Vincent van Gogh's pieces", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "LIKE", + "value": "National" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "museumName", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 265, + "database_schema_index": 4, + "natural_language_query": "Find museums that are most relevant to \"historical importance\" based on exhibitHighlights. Include only those museums where the museumName contains \"Art Gallery\", and show the percentage of these that are openToday.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that are most relevant to \"historical importance\" based on exhibitHighlights. Include only those museums where the museumName contains \"Art Gallery\", and show the percentage of these that are openToday.", + "target_collection": "Museums", + "search_query": "historical importance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "LIKE", + "value": "Art Gallery" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that are most relevant to \"historical importance\" based on exhibitHighlights. Include only those museums where the museumName contains \"Art Gallery\", and show the percentage of these that are openToday.", + "target_collection": "Museums", + "search_query": "historical importance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "LIKE", + "value": "Art Gallery" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 266, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions that are about modern art with innovative displays by looking at the exhibition descriptions. Filter these exhibitions to include only those with 'Masterpiece' in their titles. Then, group the results based on whether the exhibitions are currently running or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions that are about modern art with innovative displays by looking at the exhibition descriptions. Filter these exhibitions to include only those with 'Masterpiece' in their titles. Then, group the results based on whether the exhibitions are currently running or not.", + "target_collection": "Exhibitions", + "search_query": "Discover exhibitions about modern art with a focus on innovative displays", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitionTitle", + "operator": "LIKE", + "value": "Masterpiece" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions that are about modern art with innovative displays by looking at the exhibition descriptions. Filter these exhibitions to include only those with 'Masterpiece' in their titles. Then, group the results based on whether the exhibitions are currently running or not.", + "target_collection": "Exhibitions", + "search_query": "modern art with innovative displays", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "title", + "operator": "LIKE", + "value": "Masterpiece" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 267, + "database_schema_index": 4, + "natural_language_query": "Which museums, including those with names similar to 'Art Museum', have collections described as having significant cultural impact?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Which museums, including those with names similar to 'Art Museum', have collections described as having significant cultural impact?", + "target_collection": "Museums", + "search_query": "The cultural significance of the museum's collection and unique exhibits that attract thousands of visitors.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "LIKE", + "value": "*Art Museum*" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Which museums, including those with names similar to 'Art Museum', have collections described as having significant cultural impact?", + "target_collection": "Museums", + "search_query": "museums with names similar to 'Art Museum' and collections described as having significant cultural impact", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "collection.size", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 268, + "database_schema_index": 4, + "natural_language_query": "What are the museums, grouped by their names, that have exhibit highlights including renaissance art and are open today, along with the sum of their entry fees?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What are the museums, grouped by their names, that have exhibit highlights including renaissance art and are open today, along with the sum of their entry fees?", + "target_collection": "Museums", + "search_query": "exhibitHighlights including 'renaissance art'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the museums, grouped by their names, that have exhibit highlights including renaissance art and are open today, along with the sum of their entry fees?", + "target_collection": "Museums", + "search_query": "exhibit highlights including renaissance art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 269, + "database_schema_index": 4, + "natural_language_query": "Find currently running exhibitions that explore the theme of Renaissance art and calculate the average visitor count.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find currently running exhibitions that explore the theme of Renaissance art and calculate the average visitor count.", + "target_collection": "Exhibitions", + "search_query": "Explore the theme of Renaissance art.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find currently running exhibitions that explore the theme of Renaissance art and calculate the average visitor count.", + "target_collection": "Exhibitions", + "search_query": "Renaissance art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isCurrentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 270, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions with thematic content related to 'contemporary art' that are currently running, categorize them by exhibitionTitle, and count the number of occurrences of each exhibitionTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions with thematic content related to 'contemporary art' that are currently running, categorize them by exhibitionTitle, and count the number of occurrences of each exhibitionTitle.", + "target_collection": "Exhibitions", + "search_query": "contemporary art", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions with thematic content related to 'contemporary art' that are currently running, categorize them by exhibitionTitle, and count the number of occurrences of each exhibitionTitle.", + "target_collection": "Exhibitions", + "search_query": "contemporary art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitionTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 271, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibits that have historical significance and are open today, and count the number of unique museum names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibits that have historical significance and are open today, and count the number of unique museum names.", + "target_collection": "Museums", + "search_query": "Search for museums that have exhibits with historical significance in their exhibitHighlights", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 272, + "database_schema_index": 4, + "natural_language_query": "Explore museums with notable exhibit highlights that include ancient history artifacts, find which ones are open today, count the total number of museums open today, and segment the results by the museum name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Explore museums with notable exhibit highlights that include ancient history artifacts, find which ones are open today, count the total number of museums open today, and segment the results by the museum name.", + "target_collection": "Museums", + "search_query": "Explore museums with notable exhibitHighlights that include ancient history artifacts", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Explore museums with notable exhibit highlights that include ancient history artifacts, find which ones are open today, count the total number of museums open today, and segment the results by the museum name.", + "target_collection": "Museums", + "search_query": "notable exhibit highlights ancient history artifacts", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 273, + "database_schema_index": 4, + "natural_language_query": "Find museums that have notable exhibits with historical significance, indicate if they are open today, and provide the percentage of museums that are indeed open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that have notable exhibits with historical significance, indicate if they are open today, and provide the percentage of museums that are indeed open today.", + "target_collection": "Museums", + "search_query": "exhibitHighlights", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that have notable exhibits with historical significance, indicate if they are open today, and provide the percentage of museums that are indeed open today.", + "target_collection": "Museums", + "search_query": "notable exhibits with historical significance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 274, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibits related to the Renaissance that are open today, and group the results by the museum's name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibits related to the Renaissance that are open today, and group the results by the museum's name.", + "target_collection": "Museums", + "search_query": "Renaissance exhibits", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibits related to the Renaissance that are open today, and group the results by the museum's name.", + "target_collection": "Museums", + "search_query": "exhibits related to the Renaissance", + "limit": 5, + "integer_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": 1 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 275, + "database_schema_index": 4, + "natural_language_query": "Find museums that highlight Renaissance art exhibits using semantic search on the exhibitHighlights property and filter to only those where openToday is true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that highlight Renaissance art exhibits using semantic search on the exhibitHighlights property and filter to only those where openToday is true.", + "target_collection": "Museums", + "search_query": "Find museums that highlight Renaissance art exhibits", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that highlight Renaissance art exhibits using semantic search on the exhibitHighlights property and filter to only those where openToday is true.", + "target_collection": "Museums", + "search_query": "Renaissance art exhibits", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitHighlights", + "operator": "LIKE", + "value": "%Renaissance art exhibits%" + }, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 276, + "database_schema_index": 4, + "natural_language_query": "Find museums that have Impressionist art mentioned in their exhibitHighlights, calculate the average entryFee, and group results based on whether they are openToday.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that have Impressionist art mentioned in their exhibitHighlights, calculate the average entryFee, and group results based on whether they are openToday.", + "target_collection": "Museums", + "search_query": "Explore museums showcasing Impressionist art in their exhibitHighlights.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that have Impressionist art mentioned in their exhibitHighlights, calculate the average entryFee, and group results based on whether they are openToday.", + "target_collection": "Museums", + "search_query": "Impressionist art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 277, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions focused on impressionism and calculate the total average visitor count using the averageVisitorCount property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions focused on impressionism and calculate the total average visitor count using the averageVisitorCount property.", + "target_collection": "Exhibitions", + "search_query": "Explore exhibitions focusing on impressionism.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions focused on impressionism and calculate the total average visitor count using the averageVisitorCount property.", + "target_collection": "Exhibitions", + "search_query": "impressionism", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 278, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibits about Renaissance art, categorize the results by their entryFee, and show the 5 most common exhibitHighlights.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibits about Renaissance art, categorize the results by their entryFee, and show the 5 most common exhibitHighlights.", + "target_collection": "Museums", + "search_query": "Search for museums that have exhibits about Renaissance art.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "entryFee" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibits about Renaissance art, categorize the results by their entryFee, and show the 5 most common exhibitHighlights.", + "target_collection": "Museums", + "search_query": "exhibits about Renaissance art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "entryFee", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 279, + "database_schema_index": 4, + "natural_language_query": "Which museums have the most notable exhibit highlights according to their exhibitHighlights description, and how many distinct museum names are there?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Which museums have the most notable exhibit highlights according to their exhibitHighlights description, and how many distinct museum names are there?", + "target_collection": "Museums", + "search_query": "Find museums with notable exhibits mentioned in exhibitHighlights", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 280, + "database_schema_index": 4, + "natural_language_query": "Identify exhibitions focusing on historical themes, group them by their current status of being open to the public, and compute the percentage of exhibitions that are currently running.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Identify exhibitions focusing on historical themes, group them by their current status of being open to the public, and compute the percentage of exhibitions that are currently running.", + "target_collection": "Exhibitions", + "search_query": "Explore exhibitions with themes of historical significance in their exhibitionDescription.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "currentlyRunning" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 281, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibitions related to the Renaissance period and count how many of these museums are open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibitions related to the Renaissance period and count how many of these museums are open today.", + "target_collection": "Museums", + "search_query": "Discover museums with exhibitions related to the Renaissance period in their exhibitHighlights property.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibitions related to the Renaissance period and count how many of these museums are open today.", + "target_collection": "Museums", + "search_query": "exhibitions related to the Renaissance period", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "totalCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 282, + "database_schema_index": 4, + "natural_language_query": "Find museums where the exhibitHighlights mention ancient artifacts and group the results by whether they are openToday.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where the exhibitHighlights mention ancient artifacts and group the results by whether they are openToday.", + "target_collection": "Museums", + "search_query": "Find museums where exhibitHighlights mention ancient artifacts", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where the exhibitHighlights mention ancient artifacts and group the results by whether they are openToday.", + "target_collection": "Museums", + "search_query": "ancient artifacts", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "openToday", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 283, + "database_schema_index": 4, + "natural_language_query": "What are the museums with exhibit highlights focusing on ancient civilizations?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What are the museums with exhibit highlights focusing on ancient civilizations?", + "target_collection": "Museums", + "search_query": "Find museums with exhibit highlights related to ancient civilizations", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "3 validation errors for IntPropertyFilter\nproperty_name\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\noperator\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\nvalue\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing" + }, + { + "query_index": 284, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions where the averageVisitorCount is at least 100, group them by exhibitionTitle, and compute the mean averageVisitorCount for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is at least 100, group them by exhibitionTitle, and compute the mean averageVisitorCount for each group.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">=", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is at least 100, group them by exhibitionTitle, and compute the mean averageVisitorCount for each group.", + "target_collection": "Exhibitions", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">=", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 285, + "database_schema_index": 4, + "natural_language_query": "Find all exhibitions where the averageVisitorCount is greater than 500, and calculate the total sum of averageVisitorCount for these exhibitions.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find all exhibitions where the averageVisitorCount is greater than 500, and calculate the total sum of averageVisitorCount for these exhibitions.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntPropertyFilter\noperator\n Field required [type=missing, input_value={'property_name': 'averag...or(': '>', 'value': 500}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing" + }, + { + "query_index": 286, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 200, count the number of different exhibition titles, and group the results by whether the exhibition is currentlyRunning.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 200, count the number of different exhibition titles, and group the results by whether the exhibition is currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 200 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 200, count the number of different exhibition titles, and group the results by whether the exhibition is currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 200 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "exhibitionTitle", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "currentlyRunning", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 287, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 1000 and count how many unique exhibitionDescription texts there are.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 1000 and count how many unique exhibitionDescription texts there are.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 1000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 1000 and count how many unique exhibitionDescription texts there are.", + "target_collection": "Exhibitions", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 1000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitionDescription", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionDescription", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 288, + "database_schema_index": 4, + "natural_language_query": "Find museums where the entryFee is 15 or less, aggregate the percentage of museums that are openToday, and group the results by museumName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where the entryFee is 15 or less, aggregate the percentage of museums that are openToday, and group the results by museumName.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": { + "property_name": "entryFee", + "operator": "<=", + "value": 15 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where the entryFee is 15 or less, aggregate the percentage of museums that are openToday, and group the results by museumName.", + "target_collection": "Museums", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "entryFee", + "operator": "<=", + "value": 15 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 289, + "database_schema_index": 4, + "natural_language_query": "Find art pieces from ArtPieces with a currentValuation of at least 1,000,000 and count how many of these are onDisplay.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find art pieces from ArtPieces with a currentValuation of at least 1,000,000 and count how many of these are onDisplay.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">=", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find art pieces from ArtPieces with a currentValuation of at least 1,000,000 and count how many of these are onDisplay.", + "target_collection": "ArtPieces", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">=", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "onDisplay", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "onDisplay", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 290, + "database_schema_index": 4, + "natural_language_query": "Show exhibitions where the averageVisitorCount is greater than or equal to 100, and group the results by the currentlyRunning status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Show exhibitions where the averageVisitorCount is greater than or equal to 100, and group the results by the currentlyRunning status.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">=", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show exhibitions where the averageVisitorCount is greater than or equal to 100, and group the results by the currentlyRunning status.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">=", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 291, + "database_schema_index": 4, + "natural_language_query": "Find art pieces with a currentValuation greater than 1,000,000.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find art pieces with a currentValuation greater than 1,000,000.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find art pieces with a currentValuation greater than 1,000,000.", + "target_collection": "ArtPieces", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 292, + "database_schema_index": 4, + "natural_language_query": "For museums that are currently open, calculate the average entry fee grouped by the name of the museum.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "For museums that are currently open, calculate the average entry fee grouped by the name of the museum.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "For museums that are currently open, calculate the average entry fee grouped by the name of the museum.", + "target_collection": "Museums", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageEntryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.65, + "error": null + }, + { + "query_index": 293, + "database_schema_index": 4, + "natural_language_query": "Find the average currentValuation of all art pieces in the ArtPieces collection whose artPieceHistory contains the word 'Renaissance'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find the average currentValuation of all art pieces in the ArtPieces collection whose artPieceHistory contains the word 'Renaissance'.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceHistory", + "operator": "LIKE", + "value": "Renaissance" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the average currentValuation of all art pieces in the ArtPieces collection whose artPieceHistory contains the word 'Renaissance'.", + "target_collection": "ArtPieces", + "search_query": "Renaissance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 294, + "database_schema_index": 4, + "natural_language_query": "Count the number of unique museums with exhibitHighlights containing 'historical significance' and group these counts by whether or not the museum is open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Count the number of unique museums with exhibitHighlights containing 'historical significance' and group these counts by whether or not the museum is open today.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitHighlights", + "operator": "LIKE", + "value": "historical significance" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 295, + "database_schema_index": 4, + "natural_language_query": "Find art pieces where \"Monet\" is mentioned in artPieceHistory, and count the number of unique artPieceName values.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find art pieces where \"Monet\" is mentioned in artPieceHistory, and count the number of unique artPieceName values.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceHistory", + "operator": "LIKE", + "value": "Monet" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 296, + "database_schema_index": 4, + "natural_language_query": "Find museums where exhibitHighlights contain the keyword 'ancient artifacts', calculate what percentage of these museums are openToday, and group the museums by entryFee to see the distribution across different price categories.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where exhibitHighlights contain the keyword 'ancient artifacts', calculate what percentage of these museums are openToday, and group the museums by entryFee to see the distribution across different price categories.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitHighlights", + "operator": "LIKE", + "value": "ancient artifacts" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "entryFee" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where exhibitHighlights contain the keyword 'ancient artifacts', calculate what percentage of these museums are openToday, and group the museums by entryFee to see the distribution across different price categories.", + "target_collection": "Museums", + "search_query": "ancient artifacts", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "entryFee", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 297, + "database_schema_index": 4, + "natural_language_query": "Find museums that mention 'renaissance' in their exhibitHighlights and count how many of them are open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that mention 'renaissance' in their exhibitHighlights and count how many of them are open today.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitHighlights", + "operator": "LIKE", + "value": "renaissance" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that mention 'renaissance' in their exhibitHighlights and count how many of them are open today.", + "target_collection": "Museums", + "search_query": "renaissance", + "limit": 5, + "integer_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": 1 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 298, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions where the exhibitionTitle contains 'Impressionism' and group the results by currentlyRunning status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions where the exhibitionTitle contains 'Impressionism' and group the results by currentlyRunning status.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitionTitle", + "operator": "LIKE", + "value": "Impressionism" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "3 validation errors for IntPropertyFilter\nproperty_name\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\noperator\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\nvalue\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing" + }, + { + "query_index": 299, + "database_schema_index": 4, + "natural_language_query": "Find art pieces where the artPieceName contains the word 'Starry'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find art pieces where the artPieceName contains the word 'Starry'.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceName", + "operator": "LIKE", + "value": "%Starry%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find art pieces where the artPieceName contains the word 'Starry'.", + "target_collection": "ArtPieces", + "search_query": "artPieceName STAR", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 300, + "database_schema_index": 4, + "natural_language_query": "Find a summary of the total averageVisitorCount for each exhibitionTitle where the exhibition is currentlyRunning.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find a summary of the total averageVisitorCount for each exhibitionTitle where the exhibition is currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find a summary of the total averageVisitorCount for each exhibitionTitle where the exhibition is currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": "exhibitionTitle", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 301, + "database_schema_index": 4, + "natural_language_query": "Find all art pieces that are on display and calculate the total current valuation of these pieces using the `onDisplay` property for filtering and `currentValuation` property for aggregation.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find all art pieces that are on display and calculate the total current valuation of these pieces using the `onDisplay` property for filtering and `currentValuation` property for aggregation.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "onDisplay", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all art pieces that are on display and calculate the total current valuation of these pieces using the `onDisplay` property for filtering and `currentValuation` property for aggregation.", + "target_collection": "ArtPieces", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "onDisplay", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 302, + "database_schema_index": 4, + "natural_language_query": "Retrieve a list of all museums that are open today, group them by the museumName, and within each group, count the occurrence of each unique exhibitHighlights.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Retrieve a list of all museums that are open today, group them by the museumName, and within each group, count the occurrence of each unique exhibitHighlights.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve a list of all museums that are open today, group them by the museumName, and within each group, count the occurrence of each unique exhibitHighlights.", + "target_collection": "Museums", + "search_query": "museums that are open today", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 303, + "database_schema_index": 4, + "natural_language_query": "Find museums in the Museums collection that are open today (using the 'openToday' boolean property filter), and determine the most common exhibit highlights among them (using text property aggregation on 'exhibitHighlights').", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums in the Museums collection that are open today (using the 'openToday' boolean property filter), and determine the most common exhibit highlights among them (using text property aggregation on 'exhibitHighlights').", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums in the Museums collection that are open today (using the 'openToday' boolean property filter), and determine the most common exhibit highlights among them (using text property aggregation on 'exhibitHighlights').", + "target_collection": "Museums", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "openToday", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 304, + "database_schema_index": 4, + "natural_language_query": "Show the percentage of exhibitions on 'exhibitionTitle' that are currently running. Group the results by exhibitionTitle to determine which specific exhibitions have the highest visitor count while currentlyRunning.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Show the percentage of exhibitions on 'exhibitionTitle' that are currently running. Group the results by exhibitionTitle to determine which specific exhibitions have the highest visitor count while currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show the percentage of exhibitions on 'exhibitionTitle' that are currently running. Group the results by exhibitionTitle to determine which specific exhibitions have the highest visitor count while currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": "exhibitionTitle", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentVisitorCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 305, + "database_schema_index": 4, + "natural_language_query": "Count how many exhibitions are currently open to the public and find those that are open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Count how many exhibitions are currently open to the public and find those that are open.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='TOTAL_TRUE', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 306, + "database_schema_index": 4, + "natural_language_query": "List all museums that are open today and group them by their entry fee.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "List all museums that are open today and group them by their entry fee.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "entryFee" + }, + "predicted_query": { + "corresponding_natural_language_query": "List all museums that are open today and group them by their entry fee.", + "target_collection": "Museums", + "search_query": "museums", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "entryFee", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 307, + "database_schema_index": 4, + "natural_language_query": "Find museums where the openToday flag is set to true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where the openToday flag is set to true.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where the openToday flag is set to true.", + "target_collection": "Museums", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 308, + "database_schema_index": 4, + "natural_language_query": "For each unique exhibitionTitle, determine the count of exhibitions that are currently running by aggregating over the currentlyRunning property and grouping the results by exhibitionTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "For each unique exhibitionTitle, determine the count of exhibitions that are currently running by aggregating over the currentlyRunning property and grouping the results by exhibitionTitle.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "For each unique exhibitionTitle, determine the count of exhibitions that are currently running by aggregating over the currentlyRunning property and grouping the results by exhibitionTitle.", + "target_collection": "Exhibitions", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 309, + "database_schema_index": 4, + "natural_language_query": "What is the mean of the averageVisitorCount in the Exhibitions collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What is the mean of the averageVisitorCount in the Exhibitions collection?", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the mean of the averageVisitorCount in the Exhibitions collection?", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 310, + "database_schema_index": 4, + "natural_language_query": "What are the top 5 most common exhibit highlights in terms of descriptions for museums, grouped by each museum's name?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What are the top 5 most common exhibit highlights in terms of descriptions for museums, grouped by each museum's name?", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='TOP_OCCURRENCES', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 311, + "database_schema_index": 4, + "natural_language_query": "What is the count of unique museum names in the Museums collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What is the count of unique museum names in the Museums collection?", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 312, + "database_schema_index": 4, + "natural_language_query": "Find out how many museums are open today and group this information by museumName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find out how many museums are open today and group this information by museumName.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find out how many museums are open today and group this information by museumName.", + "target_collection": "Museums", + "search_query": "museums open today", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 313, + "database_schema_index": 4, + "natural_language_query": "Calculate the percentage of museums that are open today based on the openToday property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of museums that are open today based on the openToday property.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of museums that are open today based on the openToday property.", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 314, + "database_schema_index": 4, + "natural_language_query": "Organize museums based on whether they are open today and calculate the average entry fee for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Organize museums based on whether they are open today and calculate the average entry fee for each group.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday" + }, + "predicted_query": { + "corresponding_natural_language_query": "Organize museums based on whether they are open today and calculate the average entry fee for each group.", + "target_collection": "Museums", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + } + ] +} \ No newline at end of file diff --git a/src/test_gorilla/grok-2-latest-02-21-25.json b/src/test_gorilla/grok-2-latest-02-21-25.json new file mode 100644 index 0000000..8abf6c6 --- /dev/null +++ b/src/test_gorilla/grok-2-latest-02-21-25.json @@ -0,0 +1,47008 @@ +{ + "timestamp": "2025-02-21T11:33:56.874233", + "model_name": "grok-2-latest", + "generate_with_models": false, + "total_queries": 315, + "successful_predictions": 304, + "failed_predictions": 11, + "average_ast_score": 0.889720394736842, + "perfect_matches": 187, + "per_schema_scores": { + "0": 0.8835937500000003, + "1": 0.8882812500000001, + "2": 0.8746093749999998, + "3": 0.7546875000000003 + }, + "detailed_results": [ + { + "query_index": 0, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine, where the average rating is at least 4, count how many such restaurants there are, and group them by whether they are currently open or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine, where the average rating is at least 4, count how many such restaurants there are, and group them by whether they are currently open or not.", + "target_collection": "Restaurants", + "search_query": "Find restaurants with a cozy ambiance and Italian cuisine", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine, where the average rating is at least 4, count how many such restaurants there are, and group them by whether they are currently open or not.", + "target_collection": "Restaurants", + "search_query": "cozy ambiance Italian cuisine", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 1, + "database_schema_index": 0, + "natural_language_query": "Find Italian cuisine restaurants with a cozy ambiance that have an average rating of at least 4, plus provide the count of such restaurants that are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find Italian cuisine restaurants with a cozy ambiance that have an average rating of at least 4, plus provide the count of such restaurants that are currently open.", + "target_collection": "Restaurants", + "search_query": "Find restaurants with cozy ambiance and Italian cuisine", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find Italian cuisine restaurants with a cozy ambiance that have an average rating of at least 4, plus provide the count of such restaurants that are currently open.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine restaurants with a cozy ambiance", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 2, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that match the description 'authentic Italian ambiance', have an averageRating greater than 4, list the top 5 most common restaurant names in this set, and partition the results based on whether the restaurant is currently open or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that match the description 'authentic Italian ambiance', have an averageRating greater than 4, list the top 5 most common restaurant names in this set, and partition the results based on whether the restaurant is currently open or not.", + "target_collection": "Restaurants", + "search_query": "authentic Italian ambiance", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that match the description 'authentic Italian ambiance', have an averageRating greater than 4, list the top 5 most common restaurant names in this set, and partition the results based on whether the restaurant is currently open or not.", + "target_collection": "Restaurants", + "search_query": "authentic Italian ambiance", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 3, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a family-friendly ambiance and Italian cuisine rated with at least 4.5 in averageRating, and identify the top 3 most common descriptions.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a family-friendly ambiance and Italian cuisine rated with at least 4.5 in averageRating, and identify the top 3 most common descriptions.", + "target_collection": "Restaurants", + "search_query": "Find restaurants with a family-friendly ambiance and Italian cuisine", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with a family-friendly ambiance and Italian cuisine rated with at least 4.5 in averageRating, and identify the top 3 most common descriptions.", + "target_collection": "Restaurants", + "search_query": "family-friendly ambiance Italian cuisine", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 4, + "database_schema_index": 0, + "natural_language_query": "Find restaurants offering Italian cuisine with a cozy atmosphere, with at least an average rating of 4.5. Also, calculate the percentage of these restaurants that are open and group results based on their open status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants offering Italian cuisine with a cozy atmosphere, with at least an average rating of 4.5. Also, calculate the percentage of these restaurants that are open and group results based on their open status.", + "target_collection": "Restaurants", + "search_query": "Find restaurants offering Italian cuisine with a cozy atmosphere", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants offering Italian cuisine with a cozy atmosphere, with at least an average rating of 4.5. Also, calculate the percentage of these restaurants that are open and group results based on their open status.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine with a cozy atmosphere", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 5, + "database_schema_index": 0, + "natural_language_query": "Find Italian cuisine restaurants with descriptions containing 'Italian cuisine', with averageRating greater than 4.0, and calculate the percentage of these that are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find Italian cuisine restaurants with descriptions containing 'Italian cuisine', with averageRating greater than 4.0, and calculate the percentage of these that are currently open.", + "target_collection": "Restaurants", + "search_query": "Search for restaurants with descriptions containing 'Italian cuisine'", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find Italian cuisine restaurants with descriptions containing 'Italian cuisine', with averageRating greater than 4.0, and calculate the percentage of these that are currently open.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian cuisine" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 6, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that are similar to Italian family-friendly places, have an averageRating of at least 4, and group them by whether they are currently open (openNow).", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that are similar to Italian family-friendly places, have an averageRating of at least 4, and group them by whether they are currently open (openNow).", + "target_collection": "Restaurants", + "search_query": "Italian, family-friendly ambiance", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that are similar to Italian family-friendly places, have an averageRating of at least 4, and group them by whether they are currently open (openNow).", + "target_collection": "Restaurants", + "search_query": "Italian family-friendly places", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">=", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 7, + "database_schema_index": 0, + "natural_language_query": "Find Italian restaurants with a cozy ambiance, and the averageRating must be greater than 4.0.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find Italian restaurants with a cozy ambiance, and the averageRating must be greater than 4.0.", + "target_collection": "Restaurants", + "search_query": "Looking for Italian restaurants with a cozy ambiance", + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find Italian restaurants with a cozy ambiance, and the averageRating must be greater than 4.0.", + "target_collection": "Restaurants", + "search_query": "Italian restaurants with a cozy ambiance", + "limit": 5, + "integer_property_filter": { + "property_name": "averageRating", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 8, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with an Italian ambiance and explicitly mentioned as family friendly in their description, calculate the average of each restaurant's averageRating, and group the results by restaurant name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with an Italian ambiance and explicitly mentioned as family friendly in their description, calculate the average of each restaurant's averageRating, and group the results by restaurant name.", + "target_collection": "Restaurants", + "search_query": "Italian ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "family friendly" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with an Italian ambiance and explicitly mentioned as family friendly in their description, calculate the average of each restaurant's averageRating, and group the results by restaurant name.", + "target_collection": "Restaurants", + "search_query": "Italian ambiance family friendly", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 9, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that have a romantic ambiance using search query, filter the results to include only those where the name contains 'Ristorante', and count the number of these restaurants using the averageRating property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that have a romantic ambiance using search query, filter the results to include only those where the name contains 'Ristorante', and count the number of these restaurants using the averageRating property.", + "target_collection": "Restaurants", + "search_query": "romantic ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "Ristorante" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that have a romantic ambiance using search query, filter the results to include only those where the name contains 'Ristorante', and count the number of these restaurants using the averageRating property.", + "target_collection": "Restaurants", + "search_query": "romantic ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "%Ristorante%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 10, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a cozy and modern ambiance that mention 'casual dining' in their description. Count the number of unique restaurant names and group the results by whether they are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a cozy and modern ambiance that mention 'casual dining' in their description. Count the number of unique restaurant names and group the results by whether they are currently open.", + "target_collection": "Restaurants", + "search_query": "Cozy and modern ambiance with festive atmosphere", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%casual dining%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with a cozy and modern ambiance that mention 'casual dining' in their description. Count the number of unique restaurant names and group the results by whether they are currently open.", + "target_collection": "Restaurants", + "search_query": "cozy modern ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "casual dining" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1000000 + }, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 11, + "database_schema_index": 0, + "natural_language_query": "Search for restaurants similar in description and ambiance to those fitting the concept of cozy and modern cuisine, filter to only include restaurants named exactly 'Ocean View Grille', and count the occurrences of each restaurant name in the results.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Search for restaurants similar in description and ambiance to those fitting the concept of cozy and modern cuisine, filter to only include restaurants named exactly 'Ocean View Grille', and count the occurrences of each restaurant name in the results.", + "target_collection": "Restaurants", + "search_query": "Find the most relevant restaurants based on their description of the cuisine and ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Ocean View Grille" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for restaurants similar in description and ambiance to those fitting the concept of cozy and modern cuisine, filter to only include restaurants named exactly 'Ocean View Grille', and count the occurrences of each restaurant name in the results.", + "target_collection": "Restaurants", + "search_query": "cozy modern cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Ocean View Grille" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 12, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a nature ambiance, having Italian cuisine in their description, calculate the percentage of restaurants currently open, and group them by their average rating to summarize.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a nature ambiance, having Italian cuisine in their description, calculate the percentage of restaurants currently open, and group them by their average rating to summarize.", + "target_collection": "Restaurants", + "search_query": "nature ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with a nature ambiance, having Italian cuisine in their description, calculate the percentage of restaurants currently open, and group them by their average rating to summarize.", + "target_collection": "Restaurants", + "search_query": "nature ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description.cuisine", + "operator": "LIKE", + "value": "Italian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 13, + "database_schema_index": 0, + "natural_language_query": "Find restaurants similar to a cozy Italian restaurant with a great wine selection, include only those whose name contains 'Grill', and count how many of them are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants similar to a cozy Italian restaurant with a great wine selection, include only those whose name contains 'Grill', and count how many of them are currently open.", + "target_collection": "Restaurants", + "search_query": "A cozy Italian restaurant with a great wine selection", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "Grill" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants similar to a cozy Italian restaurant with a great wine selection, include only those whose name contains 'Grill', and count how many of them are currently open.", + "target_collection": "Restaurants", + "search_query": "cozy Italian restaurant with a great wine selection", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "%Grill%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 14, + "database_schema_index": 0, + "natural_language_query": "Find restaurants offering authentic Italian cuisine while they are open now, and group these restaurants by their average rating.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants offering authentic Italian cuisine while they are open now, and group these restaurants by their average rating.", + "target_collection": "Restaurants", + "search_query": "authentic Italian cuisine", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants offering authentic Italian cuisine while they are open now, and group these restaurants by their average rating.", + "target_collection": "Restaurants", + "search_query": "authentic Italian cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 15, + "database_schema_index": 0, + "natural_language_query": "Search for restaurants that are famous for Italian cuisine using semantic search for 'cuisine' and 'ambiance', and additionally filter to show only those whose description explicitly contains the word 'romantic'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Search for restaurants that are famous for Italian cuisine using semantic search for 'cuisine' and 'ambiance', and additionally filter to show only those whose description explicitly contains the word 'romantic'.", + "target_collection": "Restaurants", + "search_query": "Find restaurants known for Italian cuisine with a romantic ambiance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "romantic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for restaurants that are famous for Italian cuisine using semantic search for 'cuisine' and 'ambiance', and additionally filter to show only those whose description explicitly contains the word 'romantic'.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine romantic ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "romantic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 16, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that offer a romantic ambiance and Italian cuisine, ensure they are open now, calculate the average rating, and organize the results by each restaurant's name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that offer a romantic ambiance and Italian cuisine, ensure they are open now, calculate the average rating, and organize the results by each restaurant's name.", + "target_collection": "Restaurants", + "search_query": "Find restaurants that offer a romantic ambiance and Italian cuisine", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that offer a romantic ambiance and Italian cuisine, ensure they are open now, calculate the average rating, and organize the results by each restaurant's name.", + "target_collection": "Restaurants", + "search_query": "romantic ambiance Italian cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 17, + "database_schema_index": 0, + "natural_language_query": "Find cozy Italian restaurants with a great wine selection that are open now, and calculate the average rating of these open restaurants.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find cozy Italian restaurants with a great wine selection that are open now, and calculate the average rating of these open restaurants.", + "target_collection": "Restaurants", + "search_query": "Looking for cozy Italian restaurants with a great wine selection", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find cozy Italian restaurants with a great wine selection that are open now, and calculate the average rating of these open restaurants.", + "target_collection": "Restaurants", + "search_query": "cozy Italian restaurants with a great wine selection", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 18, + "database_schema_index": 0, + "natural_language_query": "What are the romantic Italian restaurants that are currently open now, and what is the most common description among them, grouped by their name?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What are the romantic Italian restaurants that are currently open now, and what is the most common description among them, grouped by their name?", + "target_collection": "Restaurants", + "search_query": "Find restaurants matching 'romantic Italian dining'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the romantic Italian restaurants that are currently open now, and what is the most common description among them, grouped by their name?", + "target_collection": "Restaurants", + "search_query": "romantic Italian restaurants", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 19, + "database_schema_index": 0, + "natural_language_query": "Find restaurants offering Mediterranean cuisine with a cozy ambiance and are currently open, then list the top 5 most common restaurant names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants offering Mediterranean cuisine with a cozy ambiance and are currently open, then list the top 5 most common restaurant names.", + "target_collection": "Restaurants", + "search_query": "Explore Mediterranean cuisine with a cozy ambiance", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants offering Mediterranean cuisine with a cozy ambiance and are currently open, then list the top 5 most common restaurant names.", + "target_collection": "Restaurants", + "search_query": "Mediterranean cuisine with a cozy ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 20, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that are known for their cozy ambiance and Italian cuisine, filter those that are currently open, aggregate to count how many are open versus closed, and organize results by the name of the restaurant.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that are known for their cozy ambiance and Italian cuisine, filter those that are currently open, aggregate to count how many are open versus closed, and organize results by the name of the restaurant.", + "target_collection": "Restaurants", + "search_query": "Find restaurants that are known for their cozy ambiance and Italian cuisine.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that are known for their cozy ambiance and Italian cuisine, filter those that are currently open, aggregate to count how many are open versus closed, and organize results by the name of the restaurant.", + "target_collection": "Restaurants", + "search_query": "cozy ambiance Italian cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 21, + "database_schema_index": 0, + "natural_language_query": "Find restaurants serving Italian cuisine with a romantic ambiance that are currently open, and calculate the percentage of restaurants that are open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants serving Italian cuisine with a romantic ambiance that are currently open, and calculate the percentage of restaurants that are open.", + "target_collection": "Restaurants", + "search_query": "Find restaurants serving Italian cuisine with a romantic ambiance", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants serving Italian cuisine with a romantic ambiance that are currently open, and calculate the percentage of restaurants that are open.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine romantic ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 22, + "database_schema_index": 0, + "natural_language_query": "Find cozy Italian restaurants that are currently open, and group them by their name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find cozy Italian restaurants that are currently open, and group them by their name.", + "target_collection": "Restaurants", + "search_query": "Find cozy Italian restaurants", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find cozy Italian restaurants that are currently open, and group them by their name.", + "target_collection": "Restaurants", + "search_query": "cozy Italian restaurants", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 23, + "database_schema_index": 0, + "natural_language_query": "Find currently open restaurants that conceptually relate to 'Italian cuisine with a cozy ambiance.'", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find currently open restaurants that conceptually relate to 'Italian cuisine with a cozy ambiance.'", + "target_collection": "Restaurants", + "search_query": "Find restaurants serving Italian cuisine with a cozy ambiance", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find currently open restaurants that conceptually relate to 'Italian cuisine with a cozy ambiance.'", + "target_collection": "Restaurants", + "search_query": "Italian cuisine with a cozy ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 24, + "database_schema_index": 0, + "natural_language_query": "What are the total party sizes of reservations that mention 'birthday' in notes, grouped by whether the reservation is confirmed?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What are the total party sizes of reservations that mention 'birthday' in notes, grouped by whether the reservation is confirmed?", + "target_collection": "Reservations", + "search_query": "Find reservations where the notes mention 'birthday'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "confirmed" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the total party sizes of reservations that mention 'birthday' in notes, grouped by whether the reservation is confirmed?", + "target_collection": "Reservations", + "search_query": "birthday", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isConfirmed", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 25, + "database_schema_index": 0, + "natural_language_query": "What is the average price of spicy vegetarian menu items?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What is the average price of spicy vegetarian menu items?", + "target_collection": "Menus", + "search_query": "Find menu items with a description that matches 'spicy vegetarian options'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "price", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average price of spicy vegetarian menu items?", + "target_collection": "MenuItems", + "search_query": "spicy vegetarian", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "price", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 26, + "database_schema_index": 0, + "natural_language_query": "Identify romantic restaurants by analyzing descriptions for ambiance, count the number of unique restaurants, and group the results by whether they are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Identify romantic restaurants by analyzing descriptions for ambiance, count the number of unique restaurants, and group the results by whether they are currently open.", + "target_collection": "Restaurants", + "search_query": "Find restaurants that offer a romantic ambiance.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify romantic restaurants by analyzing descriptions for ambiance, count the number of unique restaurants, and group the results by whether they are currently open.", + "target_collection": "Restaurants", + "search_query": "romantic ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "id", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 27, + "database_schema_index": 0, + "natural_language_query": "Identify how many unique restaurants offer a cozy Italian cuisine with a romantic ambiance by analyzing their descriptions and count the occurrences of different restaurant names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Identify how many unique restaurants offer a cozy Italian cuisine with a romantic ambiance by analyzing their descriptions and count the occurrences of different restaurant names.", + "target_collection": "Restaurants", + "search_query": "Find restaurants with a description that matches 'cozy Italian cuisine with romantic ambiance'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify how many unique restaurants offer a cozy Italian cuisine with a romantic ambiance by analyzing their descriptions and count the occurrences of different restaurant names.", + "target_collection": "Restaurants", + "search_query": "cozy Italian cuisine with romantic ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10000 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 28, + "database_schema_index": 0, + "natural_language_query": "What percentage of restaurants that offer outdoor seating and live music are currently open, and how are they distributed by their average rating?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What percentage of restaurants that offer outdoor seating and live music are currently open, and how are they distributed by their average rating?", + "target_collection": "Restaurants", + "search_query": "Find restaurants that offer outdoor seating and live music.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "What percentage of restaurants that offer outdoor seating and live music are currently open, and how are they distributed by their average rating?", + "target_collection": "Restaurants", + "search_query": "restaurants with outdoor seating and live music", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 29, + "database_schema_index": 0, + "natural_language_query": "What percentage of confirmed reservations mention the word 'celebration' in the notes?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What percentage of confirmed reservations mention the word 'celebration' in the notes?", + "target_collection": "Reservations", + "search_query": "celebration", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "confirmed", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What percentage of confirmed reservations mention the word 'celebration' in the notes?", + "target_collection": "Reservations", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "confirmed", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "notes", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 30, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine in their description using search_query, and then group these restaurants by their averageRating.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine in their description using search_query, and then group these restaurants by their averageRating.", + "target_collection": "Restaurants", + "search_query": "restaurants with a cozy ambiance and Italian cuisine", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with a cozy ambiance and Italian cuisine in their description using search_query, and then group these restaurants by their averageRating.", + "target_collection": "Restaurants", + "search_query": "cozy ambiance Italian cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 31, + "database_schema_index": 0, + "natural_language_query": "Find restaurants described as having a cozy ambiance in their detailed description.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants described as having a cozy ambiance in their detailed description.", + "target_collection": "Restaurants", + "search_query": "{\"query\":\"Find restaurants with cozy ambiance.\"}", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants described as having a cozy ambiance in their detailed description.", + "target_collection": "Restaurants", + "search_query": "cozy ambiance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 32, + "database_schema_index": 0, + "natural_language_query": "Find reservations where the partySize is greater than 4, group the results by reservationName, and calculate the average partySize for each reservationName group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find reservations where the partySize is greater than 4, group the results by reservationName, and calculate the average partySize for each reservationName group.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find reservations where the partySize is greater than 4, group the results by reservationName, and calculate the average partySize for each reservationName group.", + "target_collection": "Reservations", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 33, + "database_schema_index": 0, + "natural_language_query": "Find how many reservations have a partySize of at least 4 people and provide the total count.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find how many reservations have a partySize of at least 4 people and provide the total count.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find how many reservations have a partySize of at least 4 people and provide the total count.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 34, + "database_schema_index": 0, + "natural_language_query": "Show all reservations with a partySize of at least 5 people, count how many times each reservationName occurs, and group the results by whether the reservation is confirmed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Show all reservations with a partySize of at least 5 people, count how many times each reservationName occurs, and group the results by whether the reservation is confirmed.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "confirmed" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show all reservations with a partySize of at least 5 people, count how many times each reservationName occurs, and group the results by whether the reservation is confirmed.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "reservationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10000 + }, + "boolean_property_aggregation": null, + "groupby_property": "isConfirmed", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 35, + "database_schema_index": 0, + "natural_language_query": "Find all menu items with a price less than $20 and determine the top 3 most common menuItem names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find all menu items with a price less than $20 and determine the top 3 most common menuItem names.", + "target_collection": "Menus", + "search_query": null, + "integer_property_filter": { + "property_name": "price", + "operator": "<", + "value": 20.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "menuItem", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all menu items with a price less than $20 and determine the top 3 most common menuItem names.", + "target_collection": "MenuItems", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "price", + "operator": "<", + "value": 20.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "menuItem", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 36, + "database_schema_index": 0, + "natural_language_query": "Find reservations that have at least 5 people in partySize, aggregate them by counting the number of true values in the confirmed status, and group the results by reservationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find reservations that have at least 5 people in partySize, aggregate them by counting the number of true values in the confirmed status, and group the results by reservationName.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find reservations that have at least 5 people in partySize, aggregate them by counting the number of true values in the confirmed status, and group the results by reservationName.", + "target_collection": "Reservations", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "confirmed", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "reservationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 37, + "database_schema_index": 0, + "natural_language_query": "Find all reservations where there are more than 4 people in the partySize and count how many of these reservations are confirmed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find all reservations where there are more than 4 people in the partySize and count how many of these reservations are confirmed.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all reservations where there are more than 4 people in the partySize and count how many of these reservations are confirmed.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isConfirmed", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 38, + "database_schema_index": 0, + "natural_language_query": "Find reservations where the partySize is at least 4 and group the results by whether the reservation is confirmed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find reservations where the partySize is at least 4 and group the results by whether the reservation is confirmed.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "confirmed" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find reservations where the partySize is at least 4 and group the results by whether the reservation is confirmed.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isConfirmed", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 39, + "database_schema_index": 0, + "natural_language_query": "Find all reservations with a partySize that is at least 5", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find all reservations with a partySize that is at least 5", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all reservations with a partySize that is at least 5", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "partySize", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 40, + "database_schema_index": 0, + "natural_language_query": "Find Italian restaurants by filtering descriptions that contain the word 'Italian', then calculate the average rating of these restaurants, and group results by whether they are currently open now.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find Italian restaurants by filtering descriptions that contain the word 'Italian', then calculate the average rating of these restaurants, and group results by whether they are currently open now.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find Italian restaurants by filtering descriptions that contain the word 'Italian', then calculate the average rating of these restaurants, and group results by whether they are currently open now.", + "target_collection": "Restaurants", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 41, + "database_schema_index": 0, + "natural_language_query": "Find restaurants with the word 'vegan' in their description and count how many such restaurants exist.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants with the word 'vegan' in their description and count how many such restaurants exist.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%vegan%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants with the word 'vegan' in their description and count how many such restaurants exist.", + "target_collection": "Restaurants", + "search_query": "vegan", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 42, + "database_schema_index": 0, + "natural_language_query": "Retrieve the count of restaurants containing 'Italian' in the description, group them by the openNow status, and provide the count of each restaurant name within those groups.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Retrieve the count of restaurants containing 'Italian' in the description, group them by the openNow status, and provide the count of each restaurant name within those groups.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%Italian%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve the count of restaurants containing 'Italian' in the description, group them by the openNow status, and provide the count of each restaurant name within those groups.", + "target_collection": "Restaurants", + "search_query": "Italian", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1000 + }, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 43, + "database_schema_index": 0, + "natural_language_query": "Find menu items with descriptions containing the word 'spicy' and determine the top three most common item names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find menu items with descriptions containing the word 'spicy' and determine the top three most common item names.", + "target_collection": "Menus", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "itemDescription", + "operator": "LIKE", + "value": "spicy" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "menuItem", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find menu items with descriptions containing the word 'spicy' and determine the top three most common item names.", + "target_collection": "MenuItems", + "search_query": "spicy", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 44, + "database_schema_index": 0, + "natural_language_query": "Find reservations that mention 'birthday' in their notes, count how many of these reservations are confirmed, and group the results by the name under which each reservation is made.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find reservations that mention 'birthday' in their notes, count how many of these reservations are confirmed, and group the results by the name under which each reservation is made.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "notes", + "operator": "LIKE", + "value": "%birthday%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find reservations that mention 'birthday' in their notes, count how many of these reservations are confirmed, and group the results by the name under which each reservation is made.", + "target_collection": "Reservations", + "search_query": "birthday", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "confirmed", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 45, + "database_schema_index": 0, + "natural_language_query": "Find all restaurants that mention 'vegan' in their description and count how many are currently open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find all restaurants that mention 'vegan' in their description and count how many are currently open.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "vegan" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all restaurants that mention 'vegan' in their description and count how many are currently open.", + "target_collection": "Restaurants", + "search_query": "vegan", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 46, + "database_schema_index": 0, + "natural_language_query": "Find restaurants where the description contains 'Italian cuisine' and group these results by their name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants where the description contains 'Italian cuisine' and group these results by their name.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian cuisine" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants where the description contains 'Italian cuisine' and group these results by their name.", + "target_collection": "Restaurants", + "search_query": "Italian cuisine", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 47, + "database_schema_index": 0, + "natural_language_query": "Find restaurants in the Restaurants collection where the description contains the keyword 'Italian'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants in the Restaurants collection where the description contains the keyword 'Italian'.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "Italian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants in the Restaurants collection where the description contains the keyword 'Italian'.", + "target_collection": "Restaurants", + "search_query": "Italian", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 48, + "database_schema_index": 0, + "natural_language_query": "Find restaurants that are currently open, group them by their averageRating, and calculate the mean averageRating for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants that are currently open, group them by their averageRating, and calculate the mean averageRating for each group.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants that are currently open, group them by their averageRating, and calculate the mean averageRating for each group.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 49, + "database_schema_index": 0, + "natural_language_query": "Determine the average rating of all restaurants that are open now, filtering by the openNow property, and calculate the mean on the averageRating property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Determine the average rating of all restaurants that are open now, filtering by the openNow property, and calculate the mean on the averageRating property.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Determine the average rating of all restaurants that are open now, filtering by the openNow property, and calculate the mean on the averageRating property.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 50, + "database_schema_index": 0, + "natural_language_query": "What types of cuisines are available in restaurants that are currently open, grouped by their average rating?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What types of cuisines are available in restaurants that are currently open, grouped by their average rating?", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "What types of cuisines are available in restaurants that are currently open, grouped by their average rating?", + "target_collection": "Restaurants", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description.cuisine", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10 + }, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 51, + "database_schema_index": 0, + "natural_language_query": "Identify the most common cuisine type among all restaurants that are currently open (using 'openNow' property for filtering and 'description' property for text aggregation).", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Identify the most common cuisine type among all restaurants that are currently open (using 'openNow' property for filtering and 'description' property for text aggregation).", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify the most common cuisine type among all restaurants that are currently open (using 'openNow' property for filtering and 'description' property for text aggregation).", + "target_collection": "Restaurants", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": "", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 52, + "database_schema_index": 0, + "natural_language_query": "Calculate the percentage of restaurants that are currently open (openNow = true), and group these open restaurants by their averageRating to understand how many are open in each rating category.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of restaurants that are currently open (openNow = true), and group these open restaurants by their averageRating to understand how many are open in each rating category.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of restaurants that are currently open (openNow = true), and group these open restaurants by their averageRating to understand how many are open in each rating category.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 53, + "database_schema_index": 0, + "natural_language_query": "Show me all confirmed reservations and count the total number of confirmed versus unconfirmed reservations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Show me all confirmed reservations and count the total number of confirmed versus unconfirmed reservations.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "confirmed", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Show me all confirmed reservations and count the total number of confirmed versus unconfirmed reservations.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isConfirmed", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isConfirmed", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "isConfirmed", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 54, + "database_schema_index": 0, + "natural_language_query": "Show all restaurants that are currently open (openNow = true), and group these by the type of cuisine mentioned in the description to see how many open restaurants exist for each cuisine type.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Show all restaurants that are currently open (openNow = true), and group these by the type of cuisine mentioned in the description to see how many open restaurants exist for each cuisine type.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show all restaurants that are currently open (openNow = true), and group these by the type of cuisine mentioned in the description to see how many open restaurants exist for each cuisine type.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description.cuisine", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 55, + "database_schema_index": 0, + "natural_language_query": "Find restaurants where openNow is true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find restaurants where openNow is true.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find restaurants where openNow is true.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 56, + "database_schema_index": 0, + "natural_language_query": "Find the total party size for reservations grouped by reservationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find the total party size for reservations grouped by reservationName.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the total party size for reservations grouped by reservationName.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "reservationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 57, + "database_schema_index": 0, + "natural_language_query": "Count the number of reservations based on their partySize.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Count the number of reservations based on their partySize.", + "target_collection": "Reservations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Count the number of reservations based on their partySize.", + "target_collection": "Reservations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "partySize", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 58, + "database_schema_index": 0, + "natural_language_query": "Find the types of cuisines mentioned most frequently in the restaurant descriptions, grouped by whether the restaurants are currently open or closed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Find the types of cuisines mentioned most frequently in the restaurant descriptions, grouped by whether the restaurants are currently open or closed.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": "openNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the types of cuisines mentioned most frequently in the restaurant descriptions, grouped by whether the restaurants are currently open or closed.", + "target_collection": "Restaurants", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description.cuisine", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10 + }, + "boolean_property_aggregation": null, + "groupby_property": "openNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 59, + "database_schema_index": 0, + "natural_language_query": "What are the three most common phrases in the description of restaurants?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "What are the three most common phrases in the description of restaurants?", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the three most common phrases in the description of restaurants?", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 60, + "database_schema_index": 0, + "natural_language_query": "Calculate the percentage of restaurants that are open now within each grouping by their average rating.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of restaurants that are open now within each grouping by their average rating.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of restaurants that are open now within each grouping by their average rating.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageRating", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openNow", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 61, + "database_schema_index": 0, + "natural_language_query": "Calculate the percentage of menu items that are vegetarian based on the isVegetarian property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of menu items that are vegetarian based on the isVegetarian property.", + "target_collection": "Menus", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isVegetarian", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of menu items that are vegetarian based on the isVegetarian property.", + "target_collection": "MenuItems", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isVegetarian", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 62, + "database_schema_index": 0, + "natural_language_query": "Group restaurants by their averageRating to analyze patterns across different rating categories, helping to understand how many restaurants fall into each rating group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Restaurants", + "properties": [ + { + "name": "name", + "data_type": [ + "string" + ], + "description": "The name of the restaurant." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed description and summary of the restaurant, including cuisine type and ambiance." + }, + { + "name": "averageRating", + "data_type": [ + "number" + ], + "description": "The average rating score out of 5 for the restaurant." + }, + { + "name": "openNow", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the restaurant is currently open." + } + ], + "envisioned_use_case_overview": "This schema focuses on enabling users to discover restaurants based on a comprehensive profile. With semantic search, users can find restaurants by cuisine, ambiance, or special features." + }, + { + "name": "Menus", + "properties": [ + { + "name": "menuItem", + "data_type": [ + "string" + ], + "description": "The name of the menu item." + }, + { + "name": "itemDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the menu item, including ingredients and preparation style." + }, + { + "name": "price", + "data_type": [ + "number" + ], + "description": "The price of the menu item." + }, + { + "name": "isVegetarian", + "data_type": [ + "boolean" + ], + "description": "A flag to indicate if the menu item is vegetarian." + } + ], + "envisioned_use_case_overview": "This schema assists in linking dining experiences with specific restaurants through their menus. Rich search features allow customers to find dishes tailored to dietary needs and price points." + }, + { + "name": "Reservations", + "properties": [ + { + "name": "reservationName", + "data_type": [ + "string" + ], + "description": "The name under which the reservation is made." + }, + { + "name": "notes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the reservation, such as special requests or celebrations." + }, + { + "name": "partySize", + "data_type": [ + "number" + ], + "description": "The number of persons in the reservation." + }, + { + "name": "confirmed", + "data_type": [ + "boolean" + ], + "description": "A flag indicating whether the reservation is confirmed." + } + ], + "envisioned_use_case_overview": "This schema integrates with the restaurants by managing booking experiences. Semantic search of reservations can uncover trends in dining preferences and commonly requested meal attributes." + } + ] + }, + "corresponding_natural_language_query": "Group restaurants by their averageRating to analyze patterns across different rating categories, helping to understand how many restaurants fall into each rating group.", + "target_collection": "Restaurants", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group restaurants by their averageRating to analyze patterns across different rating categories, helping to understand how many restaurants fall into each rating group.", + "target_collection": "Restaurants", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averageRating", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 63, + "database_schema_index": 0, + "natural_language_query": "Identify clinics that specialize in pediatric care using semantic search, filter out only those with an averagePatientSatisfaction of 4.5 or higher, calculate the mean averagePatientSatisfaction, and group these results based on whether they are acceptingNewPatients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Identify clinics that specialize in pediatric care using semantic search, filter out only those with an averagePatientSatisfaction of 4.5 or higher, calculate the mean averagePatientSatisfaction, and group these results based on whether they are acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": "Find clinics that specialize in pediatric care", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify clinics that specialize in pediatric care using semantic search, filter out only those with an averagePatientSatisfaction of 4.5 or higher, calculate the mean averagePatientSatisfaction, and group these results based on whether they are acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": "pediatric care", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 64, + "database_schema_index": 1, + "natural_language_query": "Retrieve clinics with descriptions including 'comprehensive healthcare', having averagePatientSatisfaction greater than 4.5, and count how many of these clinics are acceptingNewPatients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Retrieve clinics with descriptions including 'comprehensive healthcare', having averagePatientSatisfaction greater than 4.5, and count how many of these clinics are acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": "Find clinics whose description includes comprehensive healthcare", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve clinics with descriptions including 'comprehensive healthcare', having averagePatientSatisfaction greater than 4.5, and count how many of these clinics are acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": "comprehensive healthcare", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 65, + "database_schema_index": 1, + "natural_language_query": "Find clinics related to cardiology with average patient satisfaction higher than 4. Resulting clinics should be grouped based on whether they are accepting new patients or not, and within each group, identify the top 5 most common service descriptions.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics related to cardiology with average patient satisfaction higher than 4. Resulting clinics should be grouped based on whether they are accepting new patients or not, and within each group, identify the top 5 most common service descriptions.", + "target_collection": "Clinics", + "search_query": "cardiology", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics related to cardiology with average patient satisfaction higher than 4. Resulting clinics should be grouped based on whether they are accepting new patients or not, and within each group, identify the top 5 most common service descriptions.", + "target_collection": "Clinics", + "search_query": "cardiology", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "serviceDescription", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 66, + "database_schema_index": 1, + "natural_language_query": "Find doctors with expertise related to dermatology and skin care, who have at least 10 years of experience, and retrieve the top 3 most common doctor names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors with expertise related to dermatology and skin care, who have at least 10 years of experience, and retrieve the top 3 most common doctor names.", + "target_collection": "Doctors", + "search_query": "Find doctors with expertise related to dermatology and skin care", + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "doctorName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors with expertise related to dermatology and skin care, who have at least 10 years of experience, and retrieve the top 3 most common doctor names.", + "target_collection": "Doctors", + "search_query": "dermatology and skin care", + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 67, + "database_schema_index": 1, + "natural_language_query": "Find clinics specialized in cardiovascular healthcare by searching \"description\"; filter these to only show clinics with an \"averagePatientSatisfaction\" greater than 4.5; determine the percentage of these clinics \"acceptingNewPatients\"; and finally, organize the results by \"clinicName\".", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics specialized in cardiovascular healthcare by searching \"description\"; filter these to only show clinics with an \"averagePatientSatisfaction\" greater than 4.5; determine the percentage of these clinics \"acceptingNewPatients\"; and finally, organize the results by \"clinicName\".", + "target_collection": "Clinics", + "search_query": "Find clinics that are specialized in cardiovascular healthcare.", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics specialized in cardiovascular healthcare by searching \"description\"; filter these to only show clinics with an \"averagePatientSatisfaction\" greater than 4.5; determine the percentage of these clinics \"acceptingNewPatients\"; and finally, organize the results by \"clinicName\".", + "target_collection": "Clinics", + "search_query": "cardiovascular healthcare", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 68, + "database_schema_index": 1, + "natural_language_query": "Find clinics offering pediatric services with an average patient satisfaction score greater than 4, and count the total number of clinics that are currently accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics offering pediatric services with an average patient satisfaction score greater than 4, and count the total number of clinics that are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find clinics offering pediatric services", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics offering pediatric services with an average patient satisfaction score greater than 4, and count the total number of clinics that are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "pediatric services", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 69, + "database_schema_index": 1, + "natural_language_query": "Find doctors who specialize in neurology with more than 10 years of experience, and group the results by whether they are currently practicing or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors who specialize in neurology with more than 10 years of experience, and group the results by whether they are currently practicing or not.", + "target_collection": "Doctors", + "search_query": "Find doctors who specialize in neurology", + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors who specialize in neurology with more than 10 years of experience, and group the results by whether they are currently practicing or not.", + "target_collection": "Doctors", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10.0 + }, + "text_property_filter": { + "property_name": "specialization", + "operator": "LIKE", + "value": "neurology" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isCurrentlyPracticing", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 70, + "database_schema_index": 1, + "natural_language_query": "Find clinics with a description similar to 'pediatric care' that have an averagePatientSatisfaction score of at least 4.5.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics with a description similar to 'pediatric care' that have an averagePatientSatisfaction score of at least 4.5.", + "target_collection": "Clinics", + "search_query": "pediatric care", + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics with a description similar to 'pediatric care' that have an averagePatientSatisfaction score of at least 4.5.", + "target_collection": "Clinics", + "search_query": "pediatric care", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 71, + "database_schema_index": 1, + "natural_language_query": "Identify clinics that offer dental services by performing a search for relevant specialties, filter specifically for a clinic named Sunny Clinic, determine the maximum average patient satisfaction score, and group the results based on whether they are accepting new patients or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Identify clinics that offer dental services by performing a search for relevant specialties, filter specifically for a clinic named Sunny Clinic, determine the maximum average patient satisfaction score, and group the results based on whether they are accepting new patients or not.", + "target_collection": "Clinics", + "search_query": "Find clinics that offer dental services and check their specialties", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "Sunny Clinic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify clinics that offer dental services by performing a search for relevant specialties, filter specifically for a clinic named Sunny Clinic, determine the maximum average patient satisfaction score, and group the results based on whether they are accepting new patients or not.", + "target_collection": "Clinics", + "search_query": "dental services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "Sunny Clinic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 72, + "database_schema_index": 1, + "natural_language_query": "Find clinics with a description similar to 'clinic with specialties in cardiology and pediatric care', where the clinicName is exactly 'City Health Center', and calculate the average of averagePatientSatisfaction for these clinics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics with a description similar to 'clinic with specialties in cardiology and pediatric care', where the clinicName is exactly 'City Health Center', and calculate the average of averagePatientSatisfaction for these clinics.", + "target_collection": "Clinics", + "search_query": "clinic with specialties in cardiology and pediatric care", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "City Health Center" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics with a description similar to 'clinic with specialties in cardiology and pediatric care', where the clinicName is exactly 'City Health Center', and calculate the average of averagePatientSatisfaction for these clinics.", + "target_collection": "Clinics", + "search_query": "clinic with specialties in cardiology and pediatric care", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "City Health Center" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 73, + "database_schema_index": 1, + "natural_language_query": "Find clinics that offer family healthcare services using semantic search, and are accepting new patients. Count the number of unique clinics and group them by average patient satisfaction score.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that offer family healthcare services using semantic search, and are accepting new patients. Count the number of unique clinics and group them by average patient satisfaction score.", + "target_collection": "Clinics", + "search_query": "Family healthcare services", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 74, + "database_schema_index": 1, + "natural_language_query": "Find clinics that describe themselves as offering holistic healthcare services, filter those with 'Health' in their clinicName, and identify the top 3 most frequently occurring clinic names from those results.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that describe themselves as offering holistic healthcare services, filter those with 'Health' in their clinicName, and identify the top 3 most frequently occurring clinic names from those results.", + "target_collection": "Clinics", + "search_query": "Find clinics that offer holistic healthcare services based on detailed description", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "LIKE", + "value": "%Health%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that describe themselves as offering holistic healthcare services, filter those with 'Health' in their clinicName, and identify the top 3 most frequently occurring clinic names from those results.", + "target_collection": "Clinics", + "search_query": "holistic healthcare services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "LIKE", + "value": "Health" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 75, + "database_schema_index": 1, + "natural_language_query": "Find the best clinics known for pediatric services, where clinic names start with 'A', group them by average patient satisfaction, and count how many are accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find the best clinics known for pediatric services, where clinic names start with 'A', group them by average patient satisfaction, and count how many are accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find the best clinics known for pediatric services", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "LIKE", + "value": "A%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the best clinics known for pediatric services, where clinic names start with 'A', group them by average patient satisfaction, and count how many are accepting new patients.", + "target_collection": "Clinics", + "search_query": "pediatric services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "A%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "averagePatientSatisfaction", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 76, + "database_schema_index": 1, + "natural_language_query": "Find appointments related to annual health check-ups by searching in appointmentNotes for 'check-up', and count how many of these appointments are confirmed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find appointments related to annual health check-ups by searching in appointmentNotes for 'check-up', and count how many of these appointments are confirmed.", + "target_collection": "Appointments", + "search_query": "Find the appointments that are relevant to annual health check-ups", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "appointmentNotes", + "operator": "LIKE", + "value": "check-up" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find appointments related to annual health check-ups by searching in appointmentNotes for 'check-up', and count how many of these appointments are confirmed.", + "target_collection": "Appointments", + "search_query": "check-up", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "confirmed", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 77, + "database_schema_index": 1, + "natural_language_query": "Search for clinics that have descriptions mentioning advanced medical technology, filter by the clinic name \"Healthcare Plus Clinic\", and group the results by whether they are accepting new patients, aggregating average patient satisfaction scores within each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Search for clinics that have descriptions mentioning advanced medical technology, filter by the clinic name \"Healthcare Plus Clinic\", and group the results by whether they are accepting new patients, aggregating average patient satisfaction scores within each group.", + "target_collection": "Clinics", + "search_query": "Find clinics whose description includes advanced medical technology.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "Healthcare Plus Clinic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for clinics that have descriptions mentioning advanced medical technology, filter by the clinic name \"Healthcare Plus Clinic\", and group the results by whether they are accepting new patients, aggregating average patient satisfaction scores within each group.", + "target_collection": "Clinics", + "search_query": "advanced medical technology", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Healthcare Plus Clinic" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "patientSatisfactionScore", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 78, + "database_schema_index": 1, + "natural_language_query": "Search for clinics whose description indicates a focus on comprehensive dermatology services and skin care treatments, and filter to include only those clinics with 'Dermatology' in their clinicName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Search for clinics whose description indicates a focus on comprehensive dermatology services and skin care treatments, and filter to include only those clinics with 'Dermatology' in their clinicName.", + "target_collection": "Clinics", + "search_query": "Find clinics that provide comprehensive dermatology services and skin care treatments", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "LIKE", + "value": "*Dermatology*" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for clinics whose description indicates a focus on comprehensive dermatology services and skin care treatments, and filter to include only those clinics with 'Dermatology' in their clinicName.", + "target_collection": "Clinics", + "search_query": "comprehensive dermatology services skin care treatments", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "LIKE", + "value": "Dermatology" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 79, + "database_schema_index": 1, + "natural_language_query": "Find clinics based on a high patient satisfaction, filter to include only those currently accepting new patients, perform an average calculation of the averagePatientSatisfaction, and group the results by clinic name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics based on a high patient satisfaction, filter to include only those currently accepting new patients, perform an average calculation of the averagePatientSatisfaction, and group the results by clinic name.", + "target_collection": "Clinics", + "search_query": "high patient satisfaction", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics based on a high patient satisfaction, filter to include only those currently accepting new patients, perform an average calculation of the averagePatientSatisfaction, and group the results by clinic name.", + "target_collection": "Clinics", + "search_query": "high patient satisfaction", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.0 + }, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 80, + "database_schema_index": 1, + "natural_language_query": "Find clinics that are conceptually related to pediatrics, are accepting new patients, and calculate the mean average patient satisfaction score across all such clinics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that are conceptually related to pediatrics, are accepting new patients, and calculate the mean average patient satisfaction score across all such clinics.", + "target_collection": "Clinics", + "search_query": "pediatrics", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that are conceptually related to pediatrics, are accepting new patients, and calculate the mean average patient satisfaction score across all such clinics.", + "target_collection": "Clinics", + "search_query": "pediatrics", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "patientSatisfactionScore", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 81, + "database_schema_index": 1, + "natural_language_query": "Find doctors with expertise in cardiology who are currently practicing, show how many doctors there are per expertise, and group them by their expertise category.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors with expertise in cardiology who are currently practicing, show how many doctors there are per expertise, and group them by their expertise category.", + "target_collection": "Doctors", + "search_query": "Find doctors with expertise in 'cardiology'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyPracticing", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "expertise" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 82, + "database_schema_index": 1, + "natural_language_query": "Find clinics that match specific healthcare needs and services, filter to show only those accepting new patients, and aggregate to find the top 5 most common descriptions of these clinics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that match specific healthcare needs and services, filter to show only those accepting new patients, and aggregate to find the top 5 most common descriptions of these clinics.", + "target_collection": "Clinics", + "search_query": "Find clinics that provide specialties or services mentioned in the search", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that match specific healthcare needs and services, filter to show only those accepting new patients, and aggregate to find the top 5 most common descriptions of these clinics.", + "target_collection": "Clinics", + "search_query": "healthcare needs and services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 83, + "database_schema_index": 1, + "natural_language_query": "Identify clinics that provide cardiology services (using descriptions for search), determine which of them are currently accepting new patients, and count the number of clinics within each range of average patient satisfaction scores.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Identify clinics that provide cardiology services (using descriptions for search), determine which of them are currently accepting new patients, and count the number of clinics within each range of average patient satisfaction scores.", + "target_collection": "Clinics", + "search_query": "Find clinics offering cardiology services", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 84, + "database_schema_index": 1, + "natural_language_query": "Find clinics that match the concept of 'family healthcare services', filter those that are accepting new patients, and calculate the percentage of clinics that are accepting new patients among the total results.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that match the concept of 'family healthcare services', filter those that are accepting new patients, and calculate the percentage of clinics that are accepting new patients among the total results.", + "target_collection": "Clinics", + "search_query": "Find clinics that match the concept of 'family healthcare services'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that match the concept of 'family healthcare services', filter those that are accepting new patients, and calculate the percentage of clinics that are accepting new patients among the total results.", + "target_collection": "Clinics", + "search_query": "family healthcare services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 85, + "database_schema_index": 1, + "natural_language_query": "Find clinics that specialize in pediatric care and are accepting new patients, then group the results by their average patient satisfaction score.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that specialize in pediatric care and are accepting new patients, then group the results by their average patient satisfaction score.", + "target_collection": "Clinics", + "search_query": "Find clinics that specialize in pediatric care", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that specialize in pediatric care and are accepting new patients, then group the results by their average patient satisfaction score.", + "target_collection": "Clinics", + "search_query": "pediatric care", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfactionScore", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 86, + "database_schema_index": 1, + "natural_language_query": "Find clinics that specialize in cardiac care based on their description and are currently accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that specialize in cardiac care based on their description and are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find clinics that specialize in cardiac care based on their description", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that specialize in cardiac care based on their description and are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "cardiac care", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 87, + "database_schema_index": 1, + "natural_language_query": "List clinics that provide excellent healthcare services. Within these clinics, group them by their clinic names and count how many are currently accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "List clinics that provide excellent healthcare services. Within these clinics, group them by their clinic names and count how many are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find clinics that match the description of providing excellent healthcare services with high specialties", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "List clinics that provide excellent healthcare services. Within these clinics, group them by their clinic names and count how many are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "excellent healthcare services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 88, + "database_schema_index": 1, + "natural_language_query": "Find doctors in the Doctors collection specializing in 'cardiology' based on their expertise property, and calculate the mean yearsOfExperience for these doctors.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors in the Doctors collection specializing in 'cardiology' based on their expertise property, and calculate the mean yearsOfExperience for these doctors.", + "target_collection": "Doctors", + "search_query": "Find doctors specializing in cardiology", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors in the Doctors collection specializing in 'cardiology' based on their expertise property, and calculate the mean yearsOfExperience for these doctors.", + "target_collection": "Doctors", + "search_query": "cardiology", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "expertise", + "operator": "LIKE", + "value": "cardiology" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 89, + "database_schema_index": 1, + "natural_language_query": "Find clinics that provide 'dental services', group them by whether they are accepting new patients, and count how many clinics are in each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that provide 'dental services', group them by whether they are accepting new patients, and count how many clinics are in each group.", + "target_collection": "Clinics", + "search_query": "Find clinics providing 'dental services'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that provide 'dental services', group them by whether they are accepting new patients, and count how many clinics are in each group.", + "target_collection": "Clinics", + "search_query": "dental services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 90, + "database_schema_index": 1, + "natural_language_query": "Find clinics offering high-quality healthcare services based on their description, and count the number of unique clinic names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics offering high-quality healthcare services based on their description, and count the number of unique clinic names.", + "target_collection": "Clinics", + "search_query": "High-quality healthcare services", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics offering high-quality healthcare services based on their description, and count the number of unique clinic names.", + "target_collection": "Clinics", + "search_query": "high-quality healthcare services", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "uniqueClinicNames", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 91, + "database_schema_index": 1, + "natural_language_query": "Search for clinics where the description mentions specific healthcare services you need, determine what percentage of these clinics are accepting new patients, and group the results by clinicName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Search for clinics where the description mentions specific healthcare services you need, determine what percentage of these clinics are accepting new patients, and group the results by clinicName.", + "target_collection": "Clinics", + "search_query": "Find clinics with descriptions similar to healthcare services or specialties you need", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for clinics where the description mentions specific healthcare services you need, determine what percentage of these clinics are accepting new patients, and group the results by clinicName.", + "target_collection": "Clinics", + "search_query": "specific healthcare services you need", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 92, + "database_schema_index": 1, + "natural_language_query": "How many clinics that offer pediatrics and family healthcare are currently accepting new patients?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "How many clinics that offer pediatrics and family healthcare are currently accepting new patients?", + "target_collection": "Clinics", + "search_query": "Find clinics that offer pediatrics and family healthcare", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "How many clinics that offer pediatrics and family healthcare are currently accepting new patients?", + "target_collection": "Clinics", + "search_query": "pediatrics family healthcare", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "id", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 93, + "database_schema_index": 1, + "natural_language_query": "Find clinics that specialize in pediatric services, offer state-of-the-art facilities, and have high ratings for patient care experience, and then group these clinics based on whether they are accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that specialize in pediatric services, offer state-of-the-art facilities, and have high ratings for patient care experience, and then group these clinics based on whether they are accepting new patients.", + "target_collection": "Clinics", + "search_query": "Find clinics that specialize in pediatric services, offer state-of-the-art facilities, and have high ratings for patient care experience", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that specialize in pediatric services, offer state-of-the-art facilities, and have high ratings for patient care experience, and then group these clinics based on whether they are accepting new patients.", + "target_collection": "Clinics", + "search_query": "pediatric services state-of-the-art facilities high ratings patient care experience", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 94, + "database_schema_index": 1, + "natural_language_query": "What clinics are recognized for their exceptional orthopedic services and a high emphasis on patient care?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "What clinics are recognized for their exceptional orthopedic services and a high emphasis on patient care?", + "target_collection": "Clinics", + "search_query": "Find clinics that are renowned for exceptional orthopedic services and have a high focus on patient care.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What clinics are recognized for their exceptional orthopedic services and a high emphasis on patient care?", + "target_collection": "Clinics", + "search_query": "exceptional orthopedic services high emphasis on patient care", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 95, + "database_schema_index": 1, + "natural_language_query": "Find doctors with more than 10 yearsOfExperience, calculate the average yearsOfExperience for these doctors, and group the results by whether they are currentlyPracticing or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors with more than 10 yearsOfExperience, calculate the average yearsOfExperience for these doctors, and group the results by whether they are currentlyPracticing or not.", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors with more than 10 yearsOfExperience, calculate the average yearsOfExperience for these doctors, and group the results by whether they are currentlyPracticing or not.", + "target_collection": "Doctors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 96, + "database_schema_index": 1, + "natural_language_query": "Find the number of clinics where the averagePatientSatisfaction score is at least 4.5", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find the number of clinics where the averagePatientSatisfaction score is at least 4.5", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the number of clinics where the averagePatientSatisfaction score is at least 4.5", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 97, + "database_schema_index": 1, + "natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5, then group results by acceptingNewPatients status and determine the top 3 most common specialties within each group's description.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5, then group results by acceptingNewPatients status and determine the top 3 most common specialties within each group's description.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5, then group results by acceptingNewPatients status and determine the top 3 most common specialties within each group's description.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description.specialties", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 98, + "database_schema_index": 1, + "natural_language_query": "Find appointments that have an appointmentDuration of at least 30 minutes and determine the most common patientName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find appointments that have an appointmentDuration of at least 30 minutes and determine the most common patientName.", + "target_collection": "Appointments", + "search_query": null, + "integer_property_filter": { + "property_name": "appointmentDuration", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "patientName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find appointments that have an appointmentDuration of at least 30 minutes and determine the most common patientName.", + "target_collection": "Appointments", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "appointmentDuration", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "patientName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 99, + "database_schema_index": 1, + "natural_language_query": "Group clinics by their clinicName, but only include those with an averagePatientSatisfaction of at least 4.5, and count how many of these clinics are currently accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Group clinics by their clinicName, but only include those with an averagePatientSatisfaction of at least 4.5, and count how many of these clinics are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group clinics by their clinicName, but only include those with an averagePatientSatisfaction of at least 4.5, and count how many of these clinics are currently accepting new patients.", + "target_collection": "Clinics", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 100, + "database_schema_index": 1, + "natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5 and count how many of these clinics are currently acceptingNewPatients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5 and count how many of these clinics are currently acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics where the averagePatientSatisfaction is at least 4.5 and count how many of these clinics are currently acceptingNewPatients.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averagePatientSatisfaction", + "operator": ">=", + "value": 4.5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 101, + "database_schema_index": 1, + "natural_language_query": "Find doctors with at least 10 years of experience and group results by whether they are currently practicing.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors with at least 10 years of experience and group results by whether they are currently practicing.", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors with at least 10 years of experience and group results by whether they are currently practicing.", + "target_collection": "Doctors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 102, + "database_schema_index": 1, + "natural_language_query": "Find doctors who have more than 10 years in yearsOfExperience", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find doctors who have more than 10 years in yearsOfExperience", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find doctors who have more than 10 years in yearsOfExperience", + "target_collection": "Doctors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 103, + "database_schema_index": 1, + "natural_language_query": "Find all clinics where the description contains the keyword 'specialty', group them by their acceptingNewPatients status, and calculate the maximum averagePatientSatisfaction score for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find all clinics where the description contains the keyword 'specialty', group them by their acceptingNewPatients status, and calculate the maximum averagePatientSatisfaction score for each group.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "specialty" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all clinics where the description contains the keyword 'specialty', group them by their acceptingNewPatients status, and calculate the maximum averagePatientSatisfaction score for each group.", + "target_collection": "Clinics", + "search_query": "specialty", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 104, + "database_schema_index": 1, + "natural_language_query": "How many appointments have the word 'consultation' in their appointmentNotes and what is their total count for appointmentDuration?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "How many appointments have the word 'consultation' in their appointmentNotes and what is their total count for appointmentDuration?", + "target_collection": "Appointments", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "appointmentNotes", + "operator": "LIKE", + "value": "consultation" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "How many appointments have the word 'consultation' in their appointmentNotes and what is their total count for appointmentDuration?", + "target_collection": "Appointments", + "search_query": "consultation", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "appointmentNotes", + "operator": "LIKE", + "value": "%consultation%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "appointmentDuration", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 105, + "database_schema_index": 1, + "natural_language_query": "Identify how many different averagePatientSatisfaction scores exist for clinics whose description includes the term 'multispecialty', grouped by the description property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Identify how many different averagePatientSatisfaction scores exist for clinics whose description includes the term 'multispecialty', grouped by the description property.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "multispecialty" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='TOP_OCCURRENCES', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 106, + "database_schema_index": 1, + "natural_language_query": "Find the number of unique clinicName values from the Clinics collection where the description contains the word 'dental' by counting these occurrences.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find the number of unique clinicName values from the Clinics collection where the description contains the word 'dental' by counting these occurrences.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%dental%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the number of unique clinicName values from the Clinics collection where the description contains the word 'dental' by counting these occurrences.", + "target_collection": "Clinics", + "search_query": "dental", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10000 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 107, + "database_schema_index": 1, + "natural_language_query": "Show the percentage of clinics accepting new patients, grouped by clinicName, where the clinic's description contains the word pediatrics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Show the percentage of clinics accepting new patients, grouped by clinicName, where the clinic's description contains the word pediatrics.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "pediatrics" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show the percentage of clinics accepting new patients, grouped by clinicName, where the clinic's description contains the word pediatrics.", + "target_collection": "Clinics", + "search_query": "pediatrics", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 108, + "database_schema_index": 1, + "natural_language_query": "Find clinics where the description includes 'cancer', and determine how many of these clinics are accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics where the description includes 'cancer', and determine how many of these clinics are accepting new patients.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%cancer%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics where the description includes 'cancer', and determine how many of these clinics are accepting new patients.", + "target_collection": "Clinics", + "search_query": "cancer", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 109, + "database_schema_index": 1, + "natural_language_query": "Find clinics that have 'pediatrics' in their description, and group them by whether they are accepting new patients.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that have 'pediatrics' in their description, and group them by whether they are accepting new patients.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "pediatrics" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that have 'pediatrics' in their description, and group them by whether they are accepting new patients.", + "target_collection": "Clinics", + "search_query": "pediatrics", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "description", + "operator": "LIKE", + "value": "%pediatrics%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 110, + "database_schema_index": 1, + "natural_language_query": "Retrieve the clinic that has the exact clinicName 'Community HealthCare Center'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Retrieve the clinic that has the exact clinicName 'Community HealthCare Center'.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "Community HealthCare Center" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve the clinic that has the exact clinicName 'Community HealthCare Center'.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "clinicName", + "operator": "=", + "value": "Community HealthCare Center" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 111, + "database_schema_index": 1, + "natural_language_query": "For clinics that are accepting new patients, calculate the mean averagePatientSatisfaction score for each category described by 'description'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "For clinics that are accepting new patients, calculate the mean averagePatientSatisfaction score for each category described by 'description'.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "description" + }, + "predicted_query": { + "corresponding_natural_language_query": "For clinics that are accepting new patients, calculate the mean averagePatientSatisfaction score for each category described by 'description'.", + "target_collection": "Clinics", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10 + }, + "boolean_property_aggregation": null, + "groupby_property": "description", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 112, + "database_schema_index": 1, + "natural_language_query": "Find clinics that are accepting new patients and calculate the mean of averagePatientSatisfaction scores for those clinics.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that are accepting new patients and calculate the mean of averagePatientSatisfaction scores for those clinics.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that are accepting new patients and calculate the mean of averagePatientSatisfaction scores for those clinics.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 113, + "database_schema_index": 1, + "natural_language_query": "Find clinics that are accepting new patients (using 'acceptingNewPatients' with true value), group the results by clinicName, and aggregate to count the occurrences of each clinic name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics that are accepting new patients (using 'acceptingNewPatients' with true value), group the results by clinicName, and aggregate to count the occurrences of each clinic name.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics that are accepting new patients (using 'acceptingNewPatients' with true value), group the results by clinicName, and aggregate to count the occurrences of each clinic name.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10000 + }, + "boolean_property_aggregation": null, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 114, + "database_schema_index": 1, + "natural_language_query": "Find all clinics where acceptingNewPatients is true, and count how many different clinics share the same description.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find all clinics where acceptingNewPatients is true, and count how many different clinics share the same description.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all clinics where acceptingNewPatients is true, and count how many different clinics share the same description.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10000 + }, + "boolean_property_aggregation": null, + "groupby_property": "description", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 115, + "database_schema_index": 1, + "natural_language_query": "Find and display the percentage of clinics that are currently accepting new patients, grouped by each clinic's name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find and display the percentage of clinics that are currently accepting new patients, grouped by each clinic's name.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find and display the percentage of clinics that are currently accepting new patients, grouped by each clinic's name.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 116, + "database_schema_index": 1, + "natural_language_query": "Find all appointments where appointmentConfirmed is false and also count the total number of appointments based on appointmentConfirmed status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find all appointments where appointmentConfirmed is false and also count the total number of appointments based on appointmentConfirmed status.", + "target_collection": "Appointments", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "appointmentConfirmed", + "operator": "=", + "value": false + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all appointments where appointmentConfirmed is false and also count the total number of appointments based on appointmentConfirmed status.", + "target_collection": "Appointments", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "appointmentConfirmed", + "operator": "=", + "value": false + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "appointmentConfirmed", + "metrics": "TOTAL_FALSE" + }, + "groupby_property": "appointmentConfirmed", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 117, + "database_schema_index": 1, + "natural_language_query": "Find all clinics that are accepting new patients and group them by clinicName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find all clinics that are accepting new patients and group them by clinicName.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all clinics that are accepting new patients and group them by clinicName.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "clinicName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 118, + "database_schema_index": 1, + "natural_language_query": "Find clinics where acceptingNewPatients is equal to true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Find clinics where acceptingNewPatients is equal to true.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find clinics where acceptingNewPatients is equal to true.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "acceptingNewPatients", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 119, + "database_schema_index": 1, + "natural_language_query": "Determine the mean years of experience for doctors, categorized by their expertise.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Determine the mean years of experience for doctors, categorized by their expertise.", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "expertise" + }, + "predicted_query": { + "corresponding_natural_language_query": "Determine the mean years of experience for doctors, categorized by their expertise.", + "target_collection": "Doctors", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "expertise", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 120, + "database_schema_index": 1, + "natural_language_query": "Using the int_property_aggregation operator, calculate the total number of years of experience across all doctors by summing the 'yearsOfExperience' property in the Doctors collection.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Using the int_property_aggregation operator, calculate the total number of years of experience across all doctors by summing the 'yearsOfExperience' property in the Doctors collection.", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Using the int_property_aggregation operator, calculate the total number of years of experience across all doctors by summing the 'yearsOfExperience' property in the Doctors collection.", + "target_collection": "Doctors", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 121, + "database_schema_index": 1, + "natural_language_query": "What are the top 5 most common areas of expertise for doctors, grouped by whether they are currently practicing?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "What are the top 5 most common areas of expertise for doctors, grouped by whether they are currently practicing?", + "target_collection": "Doctors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "expertise", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "currentlyPracticing" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the top 5 most common areas of expertise for doctors, grouped by whether they are currently practicing?", + "target_collection": "Doctors", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "areaOfExpertise", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "isCurrentlyPracticing", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.65, + "error": null + }, + { + "query_index": 122, + "database_schema_index": 1, + "natural_language_query": "What are the top 5 most common clinicName entries in the Clinics collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "What are the top 5 most common clinicName entries in the Clinics collection?", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the top 5 most common clinicName entries in the Clinics collection?", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "clinicName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 123, + "database_schema_index": 1, + "natural_language_query": "Calculate the percentage of clinics that are accepting new patients, grouped by their average patient satisfaction.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of clinics that are accepting new patients, grouped by their average patient satisfaction.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of clinics that are accepting new patients, grouped by their average patient satisfaction.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averagePatientSatisfaction", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "averagePatientSatisfaction", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 124, + "database_schema_index": 1, + "natural_language_query": "How many clinics are currently accepting new patients compared to those that are not?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "How many clinics are currently accepting new patients compared to those that are not?", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "How many clinics are currently accepting new patients compared to those that are not?", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingNewPatients", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "acceptingNewPatients", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 125, + "database_schema_index": 1, + "natural_language_query": "Group clinics by their averagePatientSatisfaction scores to see the distribution of clinics based on patient satisfaction levels, organizing the results into different satisfaction categories.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Clinics", + "properties": [ + { + "name": "clinicName", + "data_type": [ + "string" + ], + "description": "The official name of the clinic." + }, + { + "name": "description", + "data_type": [ + "string" + ], + "description": "A detailed overview of the clinic, including specialties and services offered." + }, + { + "name": "averagePatientSatisfaction", + "data_type": [ + "number" + ], + "description": "The average patient satisfaction score for the clinic." + }, + { + "name": "acceptingNewPatients", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the clinic is currently accepting new patients." + } + ], + "envisioned_use_case_overview": "This schema aims to help users discover clinics based on services, specialties, and patient satisfaction. Semantic search can be used to find clinics by specific healthcare needs or service qualities." + }, + { + "name": "Doctors", + "properties": [ + { + "name": "doctorName", + "data_type": [ + "string" + ], + "description": "The full name of the doctor." + }, + { + "name": "expertise", + "data_type": [ + "string" + ], + "description": "A detailed description of the doctor's areas of medical expertise and specialties." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years of experience the doctor has." + }, + { + "name": "currentlyPracticing", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the doctor is currently practicing at any clinic." + } + ], + "envisioned_use_case_overview": "This schema supports finding doctors based on expertise and experience. With semantic search, users can match their health concerns to the right professionals by exploring detailed profiles." + }, + { + "name": "Appointments", + "properties": [ + { + "name": "patientName", + "data_type": [ + "string" + ], + "description": "The name of the patient who booked the appointment." + }, + { + "name": "appointmentNotes", + "data_type": [ + "string" + ], + "description": "Detailed notes about the appointment including purpose and any special requests." + }, + { + "name": "appointmentDuration", + "data_type": [ + "number" + ], + "description": "The duration of the appointment in minutes." + }, + { + "name": "appointmentConfirmed", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the appointment is confirmed." + } + ], + "envisioned_use_case_overview": "This schema is designed to manage and optimize booking experiences by allowing semantic searches for specific appointment details and patient booking patterns." + } + ] + }, + "corresponding_natural_language_query": "Group clinics by their averagePatientSatisfaction scores to see the distribution of clinics based on patient satisfaction levels, organizing the results into different satisfaction categories.", + "target_collection": "Clinics", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group clinics by their averagePatientSatisfaction scores to see the distribution of clinics based on patient satisfaction levels, organizing the results into different satisfaction categories.", + "target_collection": "Clinics", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "averagePatientSatisfaction", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 126, + "database_schema_index": 1, + "natural_language_query": "Show me students interested in 'learning algorithms' who have completed more than 20 completedCredits, aggregate the count of completedCredits for these students, and group the results by their enrolledFullTime status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Show me students interested in 'learning algorithms' who have completed more than 20 completedCredits, aggregate the count of completedCredits for these students, and group the results by their enrolledFullTime status.", + "target_collection": "Students", + "search_query": "learning algorithms", + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show me students interested in 'learning algorithms' who have completed more than 20 completedCredits, aggregate the count of completedCredits for these students, and group the results by their enrolledFullTime status.", + "target_collection": "Students", + "search_query": "learning algorithms", + "limit": 5, + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "completedCredits", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 127, + "database_schema_index": 1, + "natural_language_query": "Find students whose researchInterests include machine learning, filter those who have completedCredits of at least 30, and calculate the average completedCredits of these students.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find students whose researchInterests include machine learning, filter those who have completedCredits of at least 30, and calculate the average completedCredits of these students.", + "target_collection": "Students", + "search_query": "Find students whose researchInterests include machine learning", + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "completedCredits", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find students whose researchInterests include machine learning, filter those who have completedCredits of at least 30, and calculate the average completedCredits of these students.", + "target_collection": "Students", + "search_query": "researchInterests include machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">=", + "value": 30.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "completedCredits", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 128, + "database_schema_index": 2, + "natural_language_query": "Identify courses related to machine learning that have a courseDuration of at least 5 hours, and determine the most frequently occurring courseTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify courses related to machine learning that have a courseDuration of at least 5 hours, and determine the most frequently occurring courseTitle.", + "target_collection": "Courses", + "search_query": "machine learning", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": "" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify courses related to machine learning that have a courseDuration of at least 5 hours, and determine the most frequently occurring courseTitle.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 5.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 129, + "database_schema_index": 2, + "natural_language_query": "Find courses that semantically relate to data science and machine learning in their courseDescription, filter for those which courseDuration is at least 40 hours, and show the top 5 most common courseTitle values for these courses.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that semantically relate to data science and machine learning in their courseDescription, filter for those which courseDuration is at least 40 hours, and show the top 5 most common courseTitle values for these courses.", + "target_collection": "Courses", + "search_query": "data science and machine learning", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 40 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that semantically relate to data science and machine learning in their courseDescription, filter for those which courseDuration is at least 40 hours, and show the top 5 most common courseTitle values for these courses.", + "target_collection": "Courses", + "search_query": "data science machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 40.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 130, + "database_schema_index": 2, + "natural_language_query": "List all courses related to artificial intelligence and machine learning that require at least 20 hours to complete, show the percentage of those courses currently accepting enrollments, and categorize the results by whether they are currently enrolling or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "List all courses related to artificial intelligence and machine learning that require at least 20 hours to complete, show the percentage of those courses currently accepting enrollments, and categorize the results by whether they are currently enrolling or not.", + "target_collection": "Courses", + "search_query": "Find courses related to artificial intelligence and machine learning.", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "List all courses related to artificial intelligence and machine learning that require at least 20 hours to complete, show the percentage of those courses currently accepting enrollments, and categorize the results by whether they are currently enrolling or not.", + "target_collection": "Courses", + "search_query": "artificial intelligence machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "duration", + "operator": ">=", + "value": 20.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "acceptingEnrollments", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "acceptingEnrollments", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.75, + "error": null + }, + { + "query_index": 131, + "database_schema_index": 2, + "natural_language_query": "Find courses that are similar to 'data science', have a courseDuration of 40 hours or less, and calculate the percentage of these courses that are currentlyEnrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are similar to 'data science', have a courseDuration of 40 hours or less, and calculate the percentage of these courses that are currentlyEnrolling.", + "target_collection": "Courses", + "search_query": "Find courses similar to data science that enhance learning outcomes", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": "<=", + "value": 40 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are similar to 'data science', have a courseDuration of 40 hours or less, and calculate the percentage of these courses that are currentlyEnrolling.", + "target_collection": "Courses", + "search_query": "data science", + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": "<=", + "value": 40.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 132, + "database_schema_index": 2, + "natural_language_query": "Find students interested in machine learning who have completed at least 30 credits, grouped by whether they are enrolled full-time.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find students interested in machine learning who have completed at least 30 credits, grouped by whether they are enrolled full-time.", + "target_collection": "Students", + "search_query": "students interested in machine learning", + "integer_property_filter": { + "property_name": "completedCredits", + "operator": ">=", + "value": 30 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find students interested in machine learning who have completed at least 30 credits, grouped by whether they are enrolled full-time.", + "target_collection": "Students", + "search_query": "interested in machine learning", + "limit": 5, + "integer_property_filter": { + "property_name": "creditsCompleted", + "operator": ">=", + "value": 30.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 133, + "database_schema_index": 2, + "natural_language_query": "Find courses that relate to artificial intelligence which have a courseDuration of at least 20 hours.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that relate to artificial intelligence which have a courseDuration of at least 20 hours.", + "target_collection": "Courses", + "search_query": "Find courses related to artificial intelligence", + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that relate to artificial intelligence which have a courseDuration of at least 20 hours.", + "target_collection": "Courses", + "search_query": "artificial intelligence", + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 134, + "database_schema_index": 2, + "natural_language_query": "What is the average duration of courses related to artificial intelligence that are currently enrolling, and organize the results by course title?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average duration of courses related to artificial intelligence that are currently enrolling, and organize the results by course title?", + "target_collection": "Courses", + "search_query": "artificial intelligence", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average duration of courses related to artificial intelligence that are currently enrolling, and organize the results by course title?", + "target_collection": "Courses", + "search_query": "artificial intelligence", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "duration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "title", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 135, + "database_schema_index": 2, + "natural_language_query": "Search for courses whose descriptions are conceptually similar to 'machine learning and artificial intelligence', filter to find courses with the exact courseTitle 'Introduction to AI', and calculate the average courseDuration of these courses.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Search for courses whose descriptions are conceptually similar to 'machine learning and artificial intelligence', filter to find courses with the exact courseTitle 'Introduction to AI', and calculate the average courseDuration of these courses.", + "target_collection": "Courses", + "search_query": "Find me the courses that cover topics similar to 'machine learning and artificial intelligence'.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "=", + "value": "Introduction to AI" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for courses whose descriptions are conceptually similar to 'machine learning and artificial intelligence', filter to find courses with the exact courseTitle 'Introduction to AI', and calculate the average courseDuration of these courses.", + "target_collection": "Courses", + "search_query": "machine learning and artificial intelligence", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "=", + "value": "Introduction to AI" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 136, + "database_schema_index": 2, + "natural_language_query": "Find courses related to data science and machine learning by courseDescription, filter these courses to only those that are currently open for enrollment, count the unique course titles, and then group the courses by their duration to analyze the number of courses segmented by different durations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses related to data science and machine learning by courseDescription, filter these courses to only those that are currently open for enrollment, count the unique course titles, and then group the courses by their duration to analyze the number of courses segmented by different durations.", + "target_collection": "Courses", + "search_query": "Find courses related to data science and machine learning by courseDescription", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses related to data science and machine learning by courseDescription, filter these courses to only those that are currently open for enrollment, count the unique course titles, and then group the courses by their duration to analyze the number of courses segmented by different durations.", + "target_collection": "Courses", + "search_query": "data science machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "%data science machine learning%" + }, + "boolean_property_filter": { + "property_name": "openForEnrollment", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": "duration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.775, + "error": null + }, + { + "query_index": 137, + "database_schema_index": 2, + "natural_language_query": "Find courses that focus on machine learning that are currently enrolling, and display the top 5 most common course titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that focus on machine learning that are currently enrolling, and display the top 5 most common course titles.", + "target_collection": "Courses", + "search_query": "Find courses that focus on machine learning", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that focus on machine learning that are currently enrolling, and display the top 5 most common course titles.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "enrollmentStatus", + "operator": "=", + "value": "enrolling" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "title", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9, + "error": null + }, + { + "query_index": 138, + "database_schema_index": 2, + "natural_language_query": "Search for courses that focus on 'machine learning' topics, filter to include only those that have 'Data Science' in their course title, calculate the percentage of these courses that are currently enrolling, and group the results by course duration.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Search for courses that focus on 'machine learning' topics, filter to include only those that have 'Data Science' in their course title, calculate the percentage of these courses that are currently enrolling, and group the results by course duration.", + "target_collection": "Courses", + "search_query": "machine learning", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Data Science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for courses that focus on 'machine learning' topics, filter to include only those that have 'Data Science' in their course title, calculate the percentage of these courses that are currently enrolling, and group the results by course duration.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Data Science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 139, + "database_schema_index": 2, + "natural_language_query": "Find instructors who are described as experienced in teaching computer science in their biography, specifically look for instructors named Jane Doe, and calculate the percentage of instructors who hold a tenured position in the 'tenured' field.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find instructors who are described as experienced in teaching computer science in their biography, specifically look for instructors named Jane Doe, and calculate the percentage of instructors who hold a tenured position in the 'tenured' field.", + "target_collection": "Instructors", + "search_query": "experienced in teaching computer science", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "instructorName", + "operator": "=", + "value": "Jane Doe" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "tenured", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find instructors who are described as experienced in teaching computer science in their biography, specifically look for instructors named Jane Doe, and calculate the percentage of instructors who hold a tenured position in the 'tenured' field.", + "target_collection": "Instructors", + "search_query": "experienced in teaching computer science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "Jane Doe" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "tenured", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 140, + "database_schema_index": 2, + "natural_language_query": "Find courses related to Python programming where the course title contains 'Introduction', and group the results by whether the courses are currently enrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses related to Python programming where the course title contains 'Introduction', and group the results by whether the courses are currently enrolling.", + "target_collection": "Courses", + "search_query": "Python programming", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "%Introduction%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses related to Python programming where the course title contains 'Introduction', and group the results by whether the courses are currently enrolling.", + "target_collection": "Courses", + "search_query": "Python programming", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "title", + "operator": "LIKE", + "value": "Introduction" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isCurrentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 141, + "database_schema_index": 2, + "natural_language_query": "Show me courses that cover 'machine learning fundamentals' in their descriptions and have the word 'Advanced' in the course title.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Show me courses that cover 'machine learning fundamentals' in their descriptions and have the word 'Advanced' in the course title.", + "target_collection": "Courses", + "search_query": "Find courses that cover 'machine learning fundamentals' in courseDescription", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Advanced" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Show me courses that cover 'machine learning fundamentals' in their descriptions and have the word 'Advanced' in the course title.", + "target_collection": "Courses", + "search_query": "machine learning fundamentals", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "title", + "operator": "LIKE", + "value": "Advanced" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 142, + "database_schema_index": 2, + "natural_language_query": "Search for courses related to machine learning and deep learning that are currently open for enrollment, calculate the average duration of these courses, and categorize the results based on the enrollment status of the courses.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Search for courses related to machine learning and deep learning that are currently open for enrollment, calculate the average duration of these courses, and categorize the results based on the enrollment status of the courses.", + "target_collection": "Courses", + "search_query": "Find courses related to machine learning and deep learning exploration", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for courses related to machine learning and deep learning that are currently open for enrollment, calculate the average duration of these courses, and categorize the results based on the enrollment status of the courses.", + "target_collection": "Courses", + "search_query": "machine learning deep learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isOpenForEnrollment", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "duration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isOpenForEnrollment", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.75, + "error": null + }, + { + "query_index": 143, + "database_schema_index": 2, + "natural_language_query": "What are the courses related to 'machine learning' that are currently enrolling, and what is the average course duration?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What are the courses related to 'machine learning' that are currently enrolling, and what is the average course duration?", + "target_collection": "Courses", + "search_query": "Find courses related to 'machine learning' based on courseDescription", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the courses related to 'machine learning' that are currently enrolling, and what is the average course duration?", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "duration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 144, + "database_schema_index": 2, + "natural_language_query": "Find courses related to \"machine learning\" in courseDescription that are currently enrolling, count the number of unique courses titles, and group the results by courseDuration.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses related to \"machine learning\" in courseDescription that are currently enrolling, count the number of unique courses titles, and group the results by courseDuration.", + "target_collection": "Courses", + "search_query": "Find courses related to \"machine learning\" in courseDescription", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses related to \"machine learning\" in courseDescription that are currently enrolling, count the number of unique courses titles, and group the results by courseDuration.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "%machine learning%" + }, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10000 + }, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 145, + "database_schema_index": 2, + "natural_language_query": "Find courses that are related to data science in courseDescription, are currently enrolling as indicated by currentlyEnrolling being true, and return the top 5 most popular course titles using courseTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are related to data science in courseDescription, are currently enrolling as indicated by currentlyEnrolling being true, and return the top 5 most popular course titles using courseTitle.", + "target_collection": "Courses", + "search_query": "Data Science", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are related to data science in courseDescription, are currently enrolling as indicated by currentlyEnrolling being true, and return the top 5 most popular course titles using courseTitle.", + "target_collection": "Courses", + "search_query": "data science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 146, + "database_schema_index": 2, + "natural_language_query": "What are the currently enrolling courses related to 'machine learning applied techniques', and how is the enrollment status distributed across these courses by course title?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What are the currently enrolling courses related to 'machine learning applied techniques', and how is the enrollment status distributed across these courses by course title?", + "target_collection": "Courses", + "search_query": "Find courses related to 'machine learning applied techniques' in courseDescription", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the currently enrolling courses related to 'machine learning applied techniques', and how is the enrollment status distributed across these courses by course title?", + "target_collection": "Courses", + "search_query": "machine learning applied techniques", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isCurrentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isCurrentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 147, + "database_schema_index": 2, + "natural_language_query": "Find courses by topics related to artificial intelligence, filter to only include those that are currently open for enrollment, and calculate the percentage of total courses that are currently enrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses by topics related to artificial intelligence, filter to only include those that are currently open for enrollment, and calculate the percentage of total courses that are currently enrolling.", + "target_collection": "Courses", + "search_query": "Find courses by topics related to artificial intelligence", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses by topics related to artificial intelligence, filter to only include those that are currently open for enrollment, and calculate the percentage of total courses that are currently enrolling.", + "target_collection": "Courses", + "search_query": "artificial intelligence", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openForEnrollment", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openForEnrollment", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9, + "error": null + }, + { + "query_index": 148, + "database_schema_index": 2, + "natural_language_query": "Find courses related to data science that are currently enrolling, and group these courses by their courseDuration to see how they vary by length.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses related to data science that are currently enrolling, and group these courses by their courseDuration to see how they vary by length.", + "target_collection": "Courses", + "search_query": "Find courses with subjects related to 'data science'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses related to data science that are currently enrolling, and group these courses by their courseDuration to see how they vary by length.", + "target_collection": "Courses", + "search_query": "data science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 149, + "database_schema_index": 2, + "natural_language_query": "Find courses with topics related to 'machine learning techniques' that are currently enrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses with topics related to 'machine learning techniques' that are currently enrolling.", + "target_collection": "Courses", + "search_query": "Find courses with topics related to 'machine learning techniques'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses with topics related to 'machine learning techniques' that are currently enrolling.", + "target_collection": "Courses", + "search_query": "machine learning techniques", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 150, + "database_schema_index": 2, + "natural_language_query": "What is the average course duration of courses related to 'machine learning fundamentals', and how does it vary between courses that are currently enrolling and those that are not?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average course duration of courses related to 'machine learning fundamentals', and how does it vary between courses that are currently enrolling and those that are not?", + "target_collection": "Courses", + "search_query": "Find courses that match the phrase 'machine learning fundamentals'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average course duration of courses related to 'machine learning fundamentals', and how does it vary between courses that are currently enrolling and those that are not?", + "target_collection": "Courses", + "search_query": "machine learning fundamentals", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "duration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 151, + "database_schema_index": 2, + "natural_language_query": "Find courses that are conceptually similar to 'data science' and calculate the average course duration in courseDuration.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are conceptually similar to 'data science' and calculate the average course duration in courseDuration.", + "target_collection": "Courses", + "search_query": "Find courses that best match the concept of 'data science'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are conceptually similar to 'data science' and calculate the average course duration in courseDuration.", + "target_collection": "Courses", + "search_query": "data science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 152, + "database_schema_index": 2, + "natural_language_query": "Find students who have research interests similar to quantum computing and determine the count of unique research interests, while grouping the results by whether they are enrolled full-time.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find students who have research interests similar to quantum computing and determine the count of unique research interests, while grouping the results by whether they are enrolled full-time.", + "target_collection": "Students", + "search_query": "quantum computing", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find students who have research interests similar to quantum computing and determine the count of unique research interests, while grouping the results by whether they are enrolled full-time.", + "target_collection": "Students", + "search_query": "quantum computing", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "researchInterests", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10 + }, + "boolean_property_aggregation": null, + "groupby_property": "enrolledFullTime", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 153, + "database_schema_index": 2, + "natural_language_query": "Find courses that are conceptually similar to 'machine learning', are currently enrolling, and identify the top 3 most common course titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are conceptually similar to 'machine learning', are currently enrolling, and identify the top 3 most common course titles.", + "target_collection": "Courses", + "search_query": "Find courses related to 'machine learning' that are open for enrollment", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are conceptually similar to 'machine learning', are currently enrolling, and identify the top 3 most common course titles.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "status", + "operator": "=", + "value": "enrolling" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "title", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 3 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 154, + "database_schema_index": 2, + "natural_language_query": "Find the most relevant students based on research interests around 'machine learning', calculate the percentage of those students enrolled full-time, and group the results by their research interests.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find the most relevant students based on research interests around 'machine learning', calculate the percentage of those students enrolled full-time, and group the results by their research interests.", + "target_collection": "Students", + "search_query": "Find the most relevant students based on research interests around 'machine learning'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "enrolledFullTime", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "researchInterests" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the most relevant students based on research interests around 'machine learning', calculate the percentage of those students enrolled full-time, and group the results by their research interests.", + "target_collection": "Students", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "enrolledFullTime", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "researchInterests", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 155, + "database_schema_index": 2, + "natural_language_query": "Find the number of courses with courseTitle or courseDescription related to 'Data Science', and summarize how many of these courses are currently open for enrollment.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find the number of courses with courseTitle or courseDescription related to 'Data Science', and summarize how many of these courses are currently open for enrollment.", + "target_collection": "Courses", + "search_query": "Data Science", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the number of courses with courseTitle or courseDescription related to 'Data Science', and summarize how many of these courses are currently open for enrollment.", + "target_collection": "Courses", + "search_query": "Data Science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "totalCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isOpenForEnrollment", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 156, + "database_schema_index": 2, + "natural_language_query": "Find courses whose courseDescription is similar to 'machine learning foundations' and group these courses by their currentlyEnrolling status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses whose courseDescription is similar to 'machine learning foundations' and group these courses by their currentlyEnrolling status.", + "target_collection": "Courses", + "search_query": "Find courses whose courseDescription is similar to 'machine learning foundations'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses whose courseDescription is similar to 'machine learning foundations' and group these courses by their currentlyEnrolling status.", + "target_collection": "Courses", + "search_query": "machine learning foundations", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 157, + "database_schema_index": 2, + "natural_language_query": "Find courses with a courseDescription that covers the entire data science lifecycle, including data collection, processing, analysis, and presentation.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses with a courseDescription that covers the entire data science lifecycle, including data collection, processing, analysis, and presentation.", + "target_collection": "Courses", + "search_query": "Find courses that cover the entire data science lifecycle, including data collection, processing, analysis, and presentation.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses with a courseDescription that covers the entire data science lifecycle, including data collection, processing, analysis, and presentation.", + "target_collection": "Courses", + "search_query": "data science lifecycle including data collection, processing, analysis, and presentation", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 158, + "database_schema_index": 2, + "natural_language_query": "Count the number of instructors grouped by tenured status who have at least 10 years in yearsOfTeaching.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Count the number of instructors grouped by tenured status who have at least 10 years in yearsOfTeaching.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "Count the number of instructors grouped by tenured status who have at least 10 years in yearsOfTeaching.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 159, + "database_schema_index": 2, + "natural_language_query": "Find the total number of instructors who have been teaching for at least 10 years based on their yearsOfTeaching.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find the total number of instructors who have been teaching for at least 10 years based on their yearsOfTeaching.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the total number of instructors who have been teaching for at least 10 years based on their yearsOfTeaching.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 160, + "database_schema_index": 2, + "natural_language_query": "Identify instructors who have been teaching for at least 10 years. For these instructors, summarize how frequently different words appear in their biography, and categorize them based on whether they hold tenured positions.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify instructors who have been teaching for at least 10 years. For these instructors, summarize how frequently different words appear in their biography, and categorize them based on whether they hold tenured positions.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify instructors who have been teaching for at least 10 years. For these instructors, summarize how frequently different words appear in their biography, and categorize them based on whether they hold tenured positions.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsTeaching", + "operator": ">=", + "value": 10.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "biography", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10 + }, + "boolean_property_aggregation": null, + "groupby_property": "isTenured", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 161, + "database_schema_index": 2, + "natural_language_query": "Find instructors who have at least 10 yearsOfTeaching and determine the top 5 most common attributes mentioned in their biography.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find instructors who have at least 10 yearsOfTeaching and determine the top 5 most common attributes mentioned in their biography.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "biography", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find instructors who have at least 10 yearsOfTeaching and determine the top 5 most common attributes mentioned in their biography.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "biography", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 162, + "database_schema_index": 2, + "natural_language_query": "Find all instructors with more than 5 years in yearsOfTeaching, show the count of tenured status and group the results by instructorName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find all instructors with more than 5 years in yearsOfTeaching, show the count of tenured status and group the results by instructorName.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "instructorName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all instructors with more than 5 years in yearsOfTeaching, show the count of tenured status and group the results by instructorName.", + "target_collection": "Instructors", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">", + "value": 5.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "tenured", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "instructorName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 163, + "database_schema_index": 2, + "natural_language_query": "Find courses with a courseDuration of at least 20 hours and determine how many of these are currently enrolling by counting the boolean currentlyEnrolling field.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses with a courseDuration of at least 20 hours and determine how many of these are currently enrolling by counting the boolean currentlyEnrolling field.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses with a courseDuration of at least 20 hours and determine how many of these are currently enrolling by counting the boolean currentlyEnrolling field.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">=", + "value": 20.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 164, + "database_schema_index": 2, + "natural_language_query": "Identify instructors who have more than 10 years of teaching experience and group them by whether they hold a tenured position.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify instructors who have more than 10 years of teaching experience and group them by whether they hold a tenured position.", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfTeaching", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify instructors who have more than 10 years of teaching experience and group them by whether they hold a tenured position.", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isTenured", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 165, + "database_schema_index": 2, + "natural_language_query": "Find courses that have a courseDuration greater than 10 hours.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that have a courseDuration greater than 10 hours.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that have a courseDuration greater than 10 hours.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "courseDuration", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 166, + "database_schema_index": 2, + "natural_language_query": "Find all courses containing 'machine learning' in the courseDescription, then group them by currentlyEnrolling status and determine the maximum courseDuration in each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find all courses containing 'machine learning' in the courseDescription, then group them by currentlyEnrolling status and determine the maximum courseDuration in each group.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "machine learning" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all courses containing 'machine learning' in the courseDescription, then group them by currentlyEnrolling status and determine the maximum courseDuration in each group.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "%machine learning%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 167, + "database_schema_index": 2, + "natural_language_query": "Find the average courseDuration of all courses that have 'Python' in their courseDescription.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find the average courseDuration of all courses that have 'Python' in their courseDescription.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "Python" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the average courseDuration of all courses that have 'Python' in their courseDescription.", + "target_collection": "Courses", + "search_query": "Python", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "%Python%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 168, + "database_schema_index": 2, + "natural_language_query": "Identify whether courses that mention 'machine learning' in their courseDescription are currently enrolling, group these courses by their currentlyEnrolling status, and list the top 5 most common courseTitles for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify whether courses that mention 'machine learning' in their courseDescription are currently enrolling, group these courses by their currentlyEnrolling status, and list the top 5 most common courseTitles for each group.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "machine learning" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify whether courses that mention 'machine learning' in their courseDescription are currently enrolling, group these courses by their currentlyEnrolling status, and list the top 5 most common courseTitles for each group.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "machine learning" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 169, + "database_schema_index": 2, + "natural_language_query": "Find and count courses with 'data science' in the courseDescription by using the courseDescription text_property_filter with LIKE, and count the total number of different course titles using courseTitle text_property_aggregation COUNT.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find and count courses with 'data science' in the courseDescription by using the courseDescription text_property_filter with LIKE, and count the total number of different course titles using courseTitle text_property_aggregation COUNT.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "data science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find and count courses with 'data science' in the courseDescription by using the courseDescription text_property_filter with LIKE, and count the total number of different course titles using courseTitle text_property_aggregation COUNT.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "data science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1000000 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 170, + "database_schema_index": 2, + "natural_language_query": "Identify all courses that include 'Data Science' in their courseTitle, count how many of these courses are currentlyEnrolling, and group the results by courseDuration to show how courses of different durations are distributed.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify all courses that include 'Data Science' in their courseTitle, count how many of these courses are currentlyEnrolling, and group the results by courseDuration to show how courses of different durations are distributed.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Data Science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify all courses that include 'Data Science' in their courseTitle, count how many of these courses are currentlyEnrolling, and group the results by courseDuration to show how courses of different durations are distributed.", + "target_collection": "Courses", + "search_query": "Data Science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "%Data Science%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 171, + "database_schema_index": 2, + "natural_language_query": "Find courses where the courseTitle contains 'Advanced' and calculate the percentage of these that are currentlyEnrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses where the courseTitle contains 'Advanced' and calculate the percentage of these that are currentlyEnrolling.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Advanced" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses where the courseTitle contains 'Advanced' and calculate the percentage of these that are currentlyEnrolling.", + "target_collection": "Courses", + "search_query": "Advanced", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "%Advanced%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 172, + "database_schema_index": 2, + "natural_language_query": "Find courses containing 'Introduction to Data Science' in the courseTitle, and group the results by currentlyEnrolling status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses containing 'Introduction to Data Science' in the courseTitle, and group the results by currentlyEnrolling status.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseTitle", + "operator": "LIKE", + "value": "Introduction to Data Science" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses containing 'Introduction to Data Science' in the courseTitle, and group the results by currentlyEnrolling status.", + "target_collection": "Courses", + "search_query": "Introduction to Data Science", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 173, + "database_schema_index": 2, + "natural_language_query": "Find courses where the courseDescription includes the phrase 'machine learning'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses where the courseDescription includes the phrase 'machine learning'.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "machine learning" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses where the courseDescription includes the phrase 'machine learning'.", + "target_collection": "Courses", + "search_query": "machine learning", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "courseDescription", + "operator": "LIKE", + "value": "machine learning" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 174, + "database_schema_index": 2, + "natural_language_query": "Find courses that are currently enrolling and group them by courseTitle, calculating the total sum of courseDuration for each courseTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses that are currently enrolling and group them by courseTitle, calculating the total sum of courseDuration for each courseTitle.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses that are currently enrolling and group them by courseTitle, calculating the total sum of courseDuration for each courseTitle.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 175, + "database_schema_index": 2, + "natural_language_query": "What is the total number of hours required to complete all courses that are currently open for enrollment?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the total number of hours required to complete all courses that are currently open for enrollment?", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "courseDuration", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the total number of hours required to complete all courses that are currently open for enrollment?", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isOpenForEnrollment", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "totalHours", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9, + "error": null + }, + { + "query_index": 176, + "database_schema_index": 2, + "natural_language_query": "Identify courses that are currently open for enrollment (using currentlyEnrolling = true), and group them by courseDuration while aggregating the top 5 most common courseTitle values.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Identify courses that are currently open for enrollment (using currentlyEnrolling = true), and group them by courseDuration while aggregating the top 5 most common courseTitle values.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify courses that are currently open for enrollment (using currentlyEnrolling = true), and group them by courseDuration while aggregating the top 5 most common courseTitle values.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 177, + "database_schema_index": 2, + "natural_language_query": "Retrieve courses that are currentlyEnrolling and count the number of unique courseTitle entries to understand how many different courses are currently open for enrollment.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Retrieve courses that are currentlyEnrolling and count the number of unique courseTitle entries to understand how many different courses are currently open for enrollment.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve courses that are currentlyEnrolling and count the number of unique courseTitle entries to understand how many different courses are currently open for enrollment.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10000 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 178, + "database_schema_index": 2, + "natural_language_query": "Find courses where currentlyEnrolling is true, calculate the percentage of such courses, and group the results by courseTitle to see enrollment status per course.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses where currentlyEnrolling is true, calculate the percentage of such courses, and group the results by courseTitle to see enrollment status per course.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses where currentlyEnrolling is true, calculate the percentage of such courses, and group the results by courseTitle to see enrollment status per course.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 179, + "database_schema_index": 2, + "natural_language_query": "Find all courses that are currently open for enrollment and calculate the total number of courses where the currentlyEnrolling property is true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find all courses that are currently open for enrollment and calculate the total number of courses where the currentlyEnrolling property is true.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all courses that are currently open for enrollment and calculate the total number of courses where the currentlyEnrolling property is true.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 180, + "database_schema_index": 2, + "natural_language_query": "Find all course titles where courses are currently enrolling and group the results by course title.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find all course titles where courses are currently enrolling and group the results by course title.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all course titles where courses are currently enrolling and group the results by course title.", + "target_collection": "Courses", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "courseTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 181, + "database_schema_index": 2, + "natural_language_query": "Find courses where currentlyEnrolling is true", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Find courses where currentlyEnrolling is true", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find courses where currentlyEnrolling is true", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyEnrolling", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 182, + "database_schema_index": 2, + "natural_language_query": "What is the average yearsOfTeaching of instructors, grouped by their tenured status?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average yearsOfTeaching of instructors, grouped by their tenured status?", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfTeaching", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average yearsOfTeaching of instructors, grouped by their tenured status?", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfTeaching", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 183, + "database_schema_index": 2, + "natural_language_query": "What is the average and maximum number of years instructors have been teaching in the yearsOfTeaching property of the Instructors collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average and maximum number of years instructors have been teaching in the yearsOfTeaching property of the Instructors collection?", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfTeaching", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "src.models.IntAggregation() argument after ** must be a mapping, not list" + }, + { + "query_index": 184, + "database_schema_index": 2, + "natural_language_query": "What is the count of each unique courseTitle for Courses, grouped by their currentlyEnrolling status?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the count of each unique courseTitle for Courses, grouped by their currentlyEnrolling status?", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyEnrolling" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 185, + "database_schema_index": 2, + "natural_language_query": "Count unique courseTitle values and find the top 5 most common course titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Count unique courseTitle values and find the top 5 most common course titles.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "courseTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 186, + "database_schema_index": 2, + "natural_language_query": "What percentage of courses are currently open for enrollment and how are these courses grouped by course duration?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What percentage of courses are currently open for enrollment and how are these courses grouped by course duration?", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyEnrolling", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseDuration" + }, + "predicted_query": { + "corresponding_natural_language_query": "What percentage of courses are currently open for enrollment and how are these courses grouped by course duration?", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openForEnrollment", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "courseDuration", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 187, + "database_schema_index": 2, + "natural_language_query": "Calculate how many courses in the Courses collection are currently open for enrollment, and determine the percentage of courses that are currently enrolling.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "Calculate how many courses in the Courses collection are currently open for enrollment, and determine the percentage of courses that are currently enrolling.", + "target_collection": "Courses", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate how many courses in the Courses collection are currently open for enrollment, and determine the percentage of courses that are currently enrolling.", + "target_collection": "Courses", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openForEnrollment", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openForEnrollment", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 188, + "database_schema_index": 2, + "natural_language_query": "What is the average years of teaching for instructors grouped by their tenured status using groupby on tenured?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Courses", + "properties": [ + { + "name": "courseTitle", + "data_type": [ + "string" + ], + "description": "The title of the course." + }, + { + "name": "courseDescription", + "data_type": [ + "string" + ], + "description": "A detailed summary of the course, including coverage topics and learning outcomes." + }, + { + "name": "courseDuration", + "data_type": [ + "number" + ], + "description": "The total number of hours required to complete the course." + }, + { + "name": "currentlyEnrolling", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the course is currently open for enrollment." + } + ], + "envisioned_use_case_overview": "This schema helps users find courses based on subject matter, duration, and enrollment status. Semantic search enhances discovery of courses by learning outcomes and topics covered." + }, + { + "name": "Instructors", + "properties": [ + { + "name": "instructorName", + "data_type": [ + "string" + ], + "description": "The full name of the instructor." + }, + { + "name": "biography", + "data_type": [ + "string" + ], + "description": "A detailed biography of the instructor, including professional background and teaching philosophy." + }, + { + "name": "yearsOfTeaching", + "data_type": [ + "number" + ], + "description": "The number of years the instructor has been teaching." + }, + { + "name": "tenured", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the instructor holds a tenured position." + } + ], + "envisioned_use_case_overview": "This schema allows students and administrators to search for instructors based on experience and background. Rich biographies help in matching students with instructors who align with their learning style and academic goals." + }, + { + "name": "Students", + "properties": [ + { + "name": "studentName", + "data_type": [ + "string" + ], + "description": "The full name of the student." + }, + { + "name": "researchInterests", + "data_type": [ + "string" + ], + "description": "Detailed information on the student's academic interests and research focus." + }, + { + "name": "completedCredits", + "data_type": [ + "number" + ], + "description": "The number of academic credits the student has completed." + }, + { + "name": "enrolledFullTime", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the student is enrolled full-time." + } + ], + "envisioned_use_case_overview": "This schema is designed to help institutions manage student data and preferences. Semantic search allows deeper insights into student research interests and progression paths." + } + ] + }, + "corresponding_natural_language_query": "What is the average years of teaching for instructors grouped by their tenured status using groupby on tenured?", + "target_collection": "Instructors", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average years of teaching for instructors grouped by their tenured status using groupby on tenured?", + "target_collection": "Instructors", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfTeaching", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "tenured", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 189, + "database_schema_index": 2, + "natural_language_query": "What is the average packagePrice of travel packages whose packageDetails correspond to 'tropical beach relaxation' and have a price less than $1500, grouped by whether a discount is available?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the average packagePrice of travel packages whose packageDetails correspond to 'tropical beach relaxation' and have a price less than $1500, grouped by whether a discount is available?", + "target_collection": "TravelPackages", + "search_query": "Find travel packages whose packageDetails match 'tropical beach relaxation'", + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average packagePrice of travel packages whose packageDetails correspond to 'tropical beach relaxation' and have a price less than $1500, grouped by whether a discount is available?", + "target_collection": "TravelPackages", + "search_query": "tropical beach relaxation", + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<", + "value": 1500.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 190, + "database_schema_index": 2, + "natural_language_query": "Find travel destinations that are related to exotic beaches and vibrant nightlife but have an averageVisitCost of no more than $1500. Additionally, determine the maximum averageVisitCost among destinations that are popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are related to exotic beaches and vibrant nightlife but have an averageVisitCost of no more than $1500. Additionally, determine the maximum averageVisitCost among destinations that are popular.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations related to exotic beaches and vibrant nightlife from destinationDescription", + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are related to exotic beaches and vibrant nightlife but have an averageVisitCost of no more than $1500. Additionally, determine the maximum averageVisitCost among destinations that are popular.", + "target_collection": "TravelDestinations", + "search_query": "exotic beaches vibrant nightlife", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500.0 + }, + "text_property_filter": { + "property_name": "popularity", + "operator": "LIKE", + "value": "popular" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 191, + "database_schema_index": 2, + "natural_language_query": "Find destinations where the description includes 'hot and sunny beaches with vibrant nightlife', the averageVisitCost is less than or equal to 1500, count how many destinations are popular, and group the results by destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations where the description includes 'hot and sunny beaches with vibrant nightlife', the averageVisitCost is less than or equal to 1500, count how many destinations are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "hot and sunny beaches with vibrant nightlife", + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find destinations where the description includes 'hot and sunny beaches with vibrant nightlife', the averageVisitCost is less than or equal to 1500, count how many destinations are popular, and group the results by destinationName.", + "target_collection": "Destinations", + "search_query": "hot and sunny beaches with vibrant nightlife", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 192, + "database_schema_index": 3, + "natural_language_query": "Find travel packages that include safaris and beaches with a packagePrice less than 1000. Also, count how many times each packageName appears in the results.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages that include safaris and beaches with a packagePrice less than 1000. Also, count how many times each packageName appears in the results.", + "target_collection": "TravelPackages", + "search_query": "Find travel packages that include safaris and beaches", + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<", + "value": 1000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages that include safaris and beaches with a packagePrice less than 1000. Also, count how many times each packageName appears in the results.", + "target_collection": "TravelPackages", + "search_query": "safaris and beaches", + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<", + "value": 1000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "packageName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1000000 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 193, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that offer peaceful beach vacations, where the averageVisitCost is less than or equal to 1500, count how many of these are popular, and group the results by destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that offer peaceful beach vacations, where the averageVisitCost is less than or equal to 1500, count how many of these are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations that offer peaceful beach vacations", + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that offer peaceful beach vacations, where the averageVisitCost is less than or equal to 1500, count how many of these are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "peaceful beach vacations", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "popularity", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10 + }, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 194, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations with beautiful beaches and rich cultural experiences where the averageVisitCost is no more than 1500, and determine what percentage of these destinations are currently popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations with beautiful beaches and rich cultural experiences where the averageVisitCost is no more than 1500, and determine what percentage of these destinations are currently popular.", + "target_collection": "TravelDestinations", + "search_query": "I want to find travel destinations with beautiful beaches and rich cultural experiences.", + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations with beautiful beaches and rich cultural experiences where the averageVisitCost is no more than 1500, and determine what percentage of these destinations are currently popular.", + "target_collection": "TravelDestinations", + "search_query": "beautiful beaches and rich cultural experiences", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitCost", + "operator": "<=", + "value": 1500.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyPopular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 195, + "database_schema_index": 3, + "natural_language_query": "Search for a relaxing vacation package that includes beach activities and cultural tours, filter for packages with a packagePrice greater than 2000, and organize the results based on whether a discount is available, using discountAvailable as the grouping property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Search for a relaxing vacation package that includes beach activities and cultural tours, filter for packages with a packagePrice greater than 2000, and organize the results based on whether a discount is available, using discountAvailable as the grouping property.", + "target_collection": "TravelPackages", + "search_query": "A relaxing vacation package with beach activities and cultural tours", + "integer_property_filter": { + "property_name": "packagePrice", + "operator": ">", + "value": 2000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for a relaxing vacation package that includes beach activities and cultural tours, filter for packages with a packagePrice greater than 2000, and organize the results based on whether a discount is available, using discountAvailable as the grouping property.", + "target_collection": "VacationPackages", + "search_query": "relaxing vacation package beach activities cultural tours", + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": ">", + "value": 2000.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 196, + "database_schema_index": 3, + "natural_language_query": "Find travel packages described as a 'relaxing beach holiday' with a packagePrice of at most $500.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages described as a 'relaxing beach holiday' with a packagePrice of at most $500.", + "target_collection": "TravelPackages", + "search_query": "Find travel packages described as a 'relaxing beach holiday'.", + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<=", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages described as a 'relaxing beach holiday' with a packagePrice of at most $500.", + "target_collection": "TravelPackages", + "search_query": "relaxing beach holiday", + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<=", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 197, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations with descriptions similar to 'beach and cultural experiences', filter for destinations named Bali, calculate the average of averageVisitCost, and group by whether destinations are popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations with descriptions similar to 'beach and cultural experiences', filter for destinations named Bali, calculate the average of averageVisitCost, and group by whether destinations are popular.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations with descriptions similar to 'beach and cultural experiences'", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "=", + "value": "Bali" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations with descriptions similar to 'beach and cultural experiences', filter for destinations named Bali, calculate the average of averageVisitCost, and group by whether destinations are popular.", + "target_collection": "TravelDestinations", + "search_query": "beach and cultural experiences", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "Bali" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isPopular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 198, + "database_schema_index": 3, + "natural_language_query": "Find destinations whose descriptions semantically emphasize beautiful landscapes, specifically retrieve destinations named \"Bora Bora\", and determine the maximum average visit cost among all destinations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations whose descriptions semantically emphasize beautiful landscapes, specifically retrieve destinations named \"Bora Bora\", and determine the maximum average visit cost among all destinations.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations with descriptions that emphasize beautiful landscapes", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "=", + "value": "Bora Bora" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find destinations whose descriptions semantically emphasize beautiful landscapes, specifically retrieve destinations named \"Bora Bora\", and determine the maximum average visit cost among all destinations.", + "target_collection": "Destinations", + "search_query": "beautiful landscapes", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "=", + "value": "Bora Bora" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 199, + "database_schema_index": 3, + "natural_language_query": "Find the most frequently occurring travel destinations that are popular among tourists, and match the phrase 'tropical beaches with vibrant nightlife', grouping them by their names and aggregating the count of each destination name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find the most frequently occurring travel destinations that are popular among tourists, and match the phrase 'tropical beaches with vibrant nightlife', grouping them by their names and aggregating the count of each destination name.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match the phrase 'tropical beaches with vibrant nightlife'", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "popular", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the most frequently occurring travel destinations that are popular among tourists, and match the phrase 'tropical beaches with vibrant nightlife', grouping them by their names and aggregating the count of each destination name.", + "target_collection": "TravelDestinations", + "search_query": "tropical beaches with vibrant nightlife", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10 + }, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 200, + "database_schema_index": 3, + "natural_language_query": "Find destinations with tropical experiences as described in the destinationDescription, locate destinations that have 'Beach' included in the destinationName, and count how many destinations are currently marked as popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations with tropical experiences as described in the destinationDescription, locate destinations that have 'Beach' included in the destinationName, and count how many destinations are currently marked as popular.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations with tropical experiences in destinationDescription", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "Beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find destinations with tropical experiences as described in the destinationDescription, locate destinations that have 'Beach' included in the destinationName, and count how many destinations are currently marked as popular.", + "target_collection": "Destinations", + "search_query": "tropical experiences", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "%Beach%" + }, + "boolean_property_filter": { + "property_name": "isPopular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 201, + "database_schema_index": 3, + "natural_language_query": "Find destinations with a description similar to 'scenic views', filter those with 'island' in their destinationName, group results by destinationName, and calculate the percentage of popular destinations within each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations with a description similar to 'scenic views', filter those with 'island' in their destinationName, group results by destinationName, and calculate the percentage of popular destinations within each group.", + "target_collection": "TravelDestinations", + "search_query": "scenic views", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "%island%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find destinations with a description similar to 'scenic views', filter those with 'island' in their destinationName, group results by destinationName, and calculate the percentage of popular destinations within each group.", + "target_collection": "Destinations", + "search_query": "scenic views", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "island" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isPopular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 202, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that are relevant to a charming winter holiday experience with various activities. Additionally, filter results to include only destinations named 'Swiss Alps', and count how many of these destinations are currently popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are relevant to a charming winter holiday experience with various activities. Additionally, filter results to include only destinations named 'Swiss Alps', and count how many of these destinations are currently popular.", + "target_collection": "TravelDestinations", + "search_query": "I am looking for a charming winter holiday experience with various activities.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "=", + "value": "Swiss Alps" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are relevant to a charming winter holiday experience with various activities. Additionally, filter results to include only destinations named 'Swiss Alps', and count how many of these destinations are currently popular.", + "target_collection": "TravelDestinations", + "search_query": "charming winter holiday experience with various activities", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "Swiss Alps" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 203, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that offer a cultural experience in their description, include 'Paris' in the destination name, and group the results by whether they are currently popular among tourists.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that offer a cultural experience in their description, include 'Paris' in the destination name, and group the results by whether they are currently popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": "A cultural experience", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "%Paris%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that offer a cultural experience in their description, include 'Paris' in the destination name, and group the results by whether they are currently popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": "cultural experience", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "Paris" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isPopularAmongTourists", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 204, + "database_schema_index": 3, + "natural_language_query": "Find travel packages that are conceptually similar to a relaxing beach vacation and have 'Caribbean' in the packageName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages that are conceptually similar to a relaxing beach vacation and have 'Caribbean' in the packageName.", + "target_collection": "TravelPackages", + "search_query": "relaxing beach vacation", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "packageName", + "operator": "LIKE", + "value": "Caribbean" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages that are conceptually similar to a relaxing beach vacation and have 'Caribbean' in the packageName.", + "target_collection": "TravelPackages", + "search_query": "relaxing beach vacation", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "packageName", + "operator": "LIKE", + "value": "Caribbean" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 205, + "database_schema_index": 3, + "natural_language_query": "Search for travel destinations with scenic beaches and vibrant local culture, filter for those that are currently popular, calculate the average cost to visit, and group by destination name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Search for travel destinations with scenic beaches and vibrant local culture, filter for those that are currently popular, calculate the average cost to visit, and group by destination name.", + "target_collection": "TravelDestinations", + "search_query": "Scenic beaches with vibrant local culture", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for travel destinations with scenic beaches and vibrant local culture, filter for those that are currently popular, calculate the average cost to visit, and group by destination name.", + "target_collection": "TravelDestinations", + "search_query": "scenic beaches and vibrant local culture", + "limit": 5, + "integer_property_filter": { + "property_name": "popularity", + "operator": ">", + "value": 80.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "costToVisit", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 206, + "database_schema_index": 3, + "natural_language_query": "Identify popular travel destinations described as tropical beaches and places with rich cultural history, and compute the average cost of visiting these popular locations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Identify popular travel destinations described as tropical beaches and places with rich cultural history, and compute the average cost of visiting these popular locations.", + "target_collection": "TravelDestinations", + "search_query": "Find tropical beaches and cultural destinations with rich histories.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify popular travel destinations described as tropical beaches and places with rich cultural history, and compute the average cost of visiting these popular locations.", + "target_collection": "TravelDestinations", + "search_query": "tropical beaches rich cultural history", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "visitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.925, + "error": null + }, + { + "query_index": 207, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations related to beach vacations that are popular, categorize them by destinationName, and identify the top 5 most common destination names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations related to beach vacations that are popular, categorize them by destinationName, and identify the top 5 most common destination names.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations related to beach vacations", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations related to beach vacations that are popular, categorize them by destinationName, and identify the top 5 most common destination names.", + "target_collection": "TravelDestinations", + "search_query": "beach vacations", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "popularity", + "operator": "LIKE", + "value": "popular" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 208, + "database_schema_index": 3, + "natural_language_query": "Find the most relevant travel destinations with scenic beaches and vibrant nightlife among those that are currently popular, and count how many travel destinations are there.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find the most relevant travel destinations with scenic beaches and vibrant nightlife among those that are currently popular, and count how many travel destinations are there.", + "target_collection": "TravelDestinations", + "search_query": "description: 'Describe destinations with scenic beaches and vibrant nightlife'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the most relevant travel destinations with scenic beaches and vibrant nightlife among those that are currently popular, and count how many travel destinations are there.", + "target_collection": "TravelDestinations", + "search_query": "scenic beaches vibrant nightlife", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "popularity", + "operator": "LIKE", + "value": "currently popular" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 209, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that match 'tropical beaches with vibrant cultures' in their destinationDescription, filter them to show only those that are currently popular, calculate the percentage of destinations that are popular, and group the results by destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that match 'tropical beaches with vibrant cultures' in their destinationDescription, filter them to show only those that are currently popular, calculate the percentage of destinations that are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match 'tropical beaches with vibrant cultures' in destinationDescription", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that match 'tropical beaches with vibrant cultures' in their destinationDescription, filter them to show only those that are currently popular, calculate the percentage of destinations that are popular, and group the results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "tropical beaches with vibrant cultures", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "tropical beaches with vibrant cultures" + }, + "boolean_property_filter": { + "property_name": "isPopular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isPopular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.875, + "error": null + }, + { + "query_index": 210, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations with sunny beaches and vibrant nightlife, filter for where they are currently popular, and count these popular destinations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations with sunny beaches and vibrant nightlife, filter for where they are currently popular, and count these popular destinations.", + "target_collection": "TravelDestinations", + "search_query": "sunny beaches and vibrant nightlife", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations with sunny beaches and vibrant nightlife, filter for where they are currently popular, and count these popular destinations.", + "target_collection": "TravelDestinations", + "search_query": "sunny beaches and vibrant nightlife", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "popularity", + "operator": "LIKE", + "value": "popular" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 211, + "database_schema_index": 3, + "natural_language_query": "Find popular travel destinations with descriptions that include scenic vistas and vibrant cultures, and group these destinations by their destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find popular travel destinations with descriptions that include scenic vistas and vibrant cultures, and group these destinations by their destinationName.", + "target_collection": "TravelDestinations", + "search_query": "Explore scenic vistas and vibrant cultures", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find popular travel destinations with descriptions that include scenic vistas and vibrant cultures, and group these destinations by their destinationName.", + "target_collection": "TravelDestinations", + "search_query": "scenic vistas and vibrant cultures", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 212, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that are popular and include descriptions related to 'tropical beaches and adventure sports'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are popular and include descriptions related to 'tropical beaches and adventure sports'.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that include descriptions related to 'tropical beaches and adventure sports' within the destinationDescription.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are popular and include descriptions related to 'tropical beaches and adventure sports'.", + "target_collection": "TravelDestinations", + "search_query": "tropical beaches and adventure sports", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "popularityScore", + "metrics": "MEAN" + }, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 213, + "database_schema_index": 3, + "natural_language_query": "Identify travel packages providing a relaxing beach holiday (using search_query on packageDetails). Within these, calculate the average packagePrice (using int_property_aggregation on packagePrice), and group the results by whether there is a discountAvailable (using groupby on discountAvailable).", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Identify travel packages providing a relaxing beach holiday (using search_query on packageDetails). Within these, calculate the average packagePrice (using int_property_aggregation on packagePrice), and group the results by whether there is a discountAvailable (using groupby on discountAvailable).", + "target_collection": "TravelPackages", + "search_query": "Find travel packages that offer a relaxing beach holiday", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify travel packages providing a relaxing beach holiday (using search_query on packageDetails). Within these, calculate the average packagePrice (using int_property_aggregation on packagePrice), and group the results by whether there is a discountAvailable (using groupby on discountAvailable).", + "target_collection": "TravelPackages", + "search_query": "relaxing beach holiday", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 214, + "database_schema_index": 3, + "natural_language_query": "What is the average cost of visiting tropical beach resorts described in detail?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the average cost of visiting tropical beach resorts described in detail?", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match the detailed description of tropical beach resorts.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average cost of visiting tropical beach resorts described in detail?", + "target_collection": "Resorts", + "search_query": "tropical beach resorts described in detail", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "cost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 215, + "database_schema_index": 3, + "natural_language_query": "List travel destinations matching a description of 'tropical beaches', count the different destination names, and group results by whether they are popular to see which group has more destinations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "List travel destinations matching a description of 'tropical beaches', count the different destination names, and group results by whether they are popular to see which group has more destinations.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that best match the description 'tropical beaches'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "List travel destinations matching a description of 'tropical beaches', count the different destination names, and group results by whether they are popular to see which group has more destinations.", + "target_collection": "TravelDestinations", + "search_query": "tropical beaches", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1000 + }, + "boolean_property_aggregation": null, + "groupby_property": "isPopular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 216, + "database_schema_index": 3, + "natural_language_query": "Find destinations that are conceptually similar to 'romantic getaway with beach access', and also list the top 5 most common destination names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find destinations that are conceptually similar to 'romantic getaway with beach access', and also list the top 5 most common destination names.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations that are conceptually similar to 'romantic getaway with beach access'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find destinations that are conceptually similar to 'romantic getaway with beach access', and also list the top 5 most common destination names.", + "target_collection": "Destinations", + "search_query": "romantic getaway with beach access", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 217, + "database_schema_index": 3, + "natural_language_query": "What percentage of destinations, grouped by destination names, are popular among tourists, and which of these have similar descriptions to 'romantic beaches with vibrant nightlife'? Please find matching entries using semantic search, and analyze the proportion of those considered popular using boolean property aggregation for the 'popular' field.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What percentage of destinations, grouped by destination names, are popular among tourists, and which of these have similar descriptions to 'romantic beaches with vibrant nightlife'? Please find matching entries using semantic search, and analyze the proportion of those considered popular using boolean property aggregation for the 'popular' field.", + "target_collection": "TravelDestinations", + "search_query": "Find destinations similar to 'romantic beaches with vibrant nightlife.'", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "What percentage of destinations, grouped by destination names, are popular among tourists, and which of these have similar descriptions to 'romantic beaches with vibrant nightlife'? Please find matching entries using semantic search, and analyze the proportion of those considered popular using boolean property aggregation for the 'popular' field.", + "target_collection": "Destinations", + "search_query": "romantic beaches with vibrant nightlife", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 218, + "database_schema_index": 3, + "natural_language_query": "What percentage of travel destinations, that match snowy mountains and vibrant city life descriptions, are currently popular among tourists?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What percentage of travel destinations, that match snowy mountains and vibrant city life descriptions, are currently popular among tourists?", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match descriptions of snowy mountains and vibrant city life.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What percentage of travel destinations, that match snowy mountains and vibrant city life descriptions, are currently popular among tourists?", + "target_collection": "TravelDestinations", + "search_query": "snowy mountains and vibrant city life", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isPopular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 219, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that match the theme 'tropical beach with vibrant nightlife', and group the results based on whether they are popular among tourists.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that match the theme 'tropical beach with vibrant nightlife', and group the results based on whether they are popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": "Find travel destinations that match the query \"tropical beach with vibrant nightlife\".", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that match the theme 'tropical beach with vibrant nightlife', and group the results based on whether they are popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": "tropical beach with vibrant nightlife", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isPopularAmongTourists", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 220, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that are conceptually similar to 'romantic nature getaways' based on the destinationDescription.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are conceptually similar to 'romantic nature getaways' based on the destinationDescription.", + "target_collection": "TravelDestinations", + "search_query": "{\"destinationDescription\":{\"operator\":\"search_query\",\"value\":\"romantic nature getaways\"}}", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are conceptually similar to 'romantic nature getaways' based on the destinationDescription.", + "target_collection": "TravelDestinations", + "search_query": "romantic nature getaways", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "%romantic nature getaways%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 221, + "database_schema_index": 3, + "natural_language_query": "Count how many travel agents have more than 5 years of experience, and group them by their agentName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Count how many travel agents have more than 5 years of experience, and group them by their agentName.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "agentName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Count how many travel agents have more than 5 years of experience, and group them by their agentName.", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "agentName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 222, + "database_schema_index": 3, + "natural_language_query": "Find travel agents who have at least 10 years in yearsOfExperience and determine the average years of experience among all travel agents.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel agents who have at least 10 years in yearsOfExperience and determine the average years of experience among all travel agents.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel agents who have at least 10 years in yearsOfExperience and determine the average years of experience among all travel agents.", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 223, + "database_schema_index": 3, + "natural_language_query": "Find travel agents who have at least 5 years in yearsOfExperience, count how many travel agents share the same agentName, and categorize the results based on whether they are availableNow.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel agents who have at least 5 years in yearsOfExperience, count how many travel agents share the same agentName, and categorize the results based on whether they are availableNow.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "availableNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel agents who have at least 5 years in yearsOfExperience, count how many travel agents share the same agentName, and categorize the results based on whether they are availableNow.", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "agentName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1000000 + }, + "boolean_property_aggregation": null, + "groupby_property": "availableNow", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 224, + "database_schema_index": 3, + "natural_language_query": "Show all travel agents with at least 5 years of experience and count the number of unique agentName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Show all travel agents with at least 5 years of experience and count the number of unique agentName.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Show all travel agents with at least 5 years of experience and count the number of unique agentName.", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "agentName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1000000 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 225, + "database_schema_index": 3, + "natural_language_query": "Find travel packages that cost no more than 2000 in packagePrice, group these results by packageName, and count the total number of packages with discounts by evaluating discountAvailable.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages that cost no more than 2000 in packagePrice, group these results by packageName, and count the total number of packages with discounts by evaluating discountAvailable.", + "target_collection": "TravelPackages", + "search_query": null, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<=", + "value": 2000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "packageName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages that cost no more than 2000 in packagePrice, group these results by packageName, and count the total number of packages with discounts by evaluating discountAvailable.", + "target_collection": "TravelPackages", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "packagePrice", + "operator": "<=", + "value": 2000.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "discountAvailable", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "packageName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 226, + "database_schema_index": 3, + "natural_language_query": "Find travel agents with at least 5 years of experience and count how many are available now.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel agents with at least 5 years of experience and count how many are available now.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel agents with at least 5 years of experience and count how many are available now.", + "target_collection": "TravelAgents", + "search_query": "", + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5.0 + }, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "availableNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 227, + "database_schema_index": 3, + "natural_language_query": "Group travel agents by their yearsOfExperience and only include those that have more than 5 years in yearsOfExperience.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Group travel agents by their yearsOfExperience and only include those that have more than 5 years in yearsOfExperience.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "yearsOfExperience" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group travel agents by their yearsOfExperience and only include those that have more than 5 years in yearsOfExperience.", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "yearsOfExperience", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 228, + "database_schema_index": 3, + "natural_language_query": "Find travel agents with at least 5 years of experience in yearsOfExperience.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel agents with at least 5 years of experience in yearsOfExperience.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel agents with at least 5 years of experience in yearsOfExperience.", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "yearsOfExperience", + "operator": ">=", + "value": 5 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 229, + "database_schema_index": 3, + "natural_language_query": "Find travel packages where the packageDetails include the keyword 'luxury', then compute the average of packagePrice for packages where discountAvailable is true, and group the results based on whether a discount is available.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel packages where the packageDetails include the keyword 'luxury', then compute the average of packagePrice for packages where discountAvailable is true, and group the results based on whether a discount is available.", + "target_collection": "TravelPackages", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "packageDetails", + "operator": "LIKE", + "value": "luxury" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel packages where the packageDetails include the keyword 'luxury', then compute the average of packagePrice for packages where discountAvailable is true, and group the results based on whether a discount is available.", + "target_collection": "TravelPackages", + "search_query": "luxury", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "discountAvailable", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 230, + "database_schema_index": 3, + "natural_language_query": "Determine the average averageVisitCost for travel destinations where destinationDescription contains the keyword 'beach'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Determine the average averageVisitCost for travel destinations where destinationDescription contains the keyword 'beach'.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Determine the average averageVisitCost for travel destinations where destinationDescription contains the keyword 'beach'.", + "target_collection": "TravelDestinations", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 231, + "database_schema_index": 3, + "natural_language_query": "List all travel destinations where the destinationDescription mentions 'popular', count how many destinations have such a description, and group these results by destinationName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "List all travel destinations where the destinationDescription mentions 'popular', count how many destinations have such a description, and group these results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "%popular%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "List all travel destinations where the destinationDescription mentions 'popular', count how many destinations have such a description, and group these results by destinationName.", + "target_collection": "TravelDestinations", + "search_query": "popular", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "id", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 232, + "database_schema_index": 3, + "natural_language_query": "Find all destinations in TravelDestinations where the destinationDescription contains the word 'beach', and count how many such destinations exist.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find all destinations in TravelDestinations where the destinationDescription contains the word 'beach', and count how many such destinations exist.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "%beach%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all destinations in TravelDestinations where the destinationDescription contains the word 'beach', and count how many such destinations exist.", + "target_collection": "TravelDestinations", + "search_query": "beach", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 233, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations where the destinationDescription includes 'beach', group the results by destinationName and count how many of these destinations are popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations where the destinationDescription includes 'beach', group the results by destinationName and count how many of these destinations are popular.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations where the destinationDescription includes 'beach', group the results by destinationName and count how many of these destinations are popular.", + "target_collection": "TravelDestinations", + "search_query": "beach", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isPopular", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 234, + "database_schema_index": 3, + "natural_language_query": "Show me travel destinations that include 'Beach' in their destinationName and count how many of them are popular using the popular attribute.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Show me travel destinations that include 'Beach' in their destinationName and count how many of them are popular using the popular attribute.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "Beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Show me travel destinations that include 'Beach' in their destinationName and count how many of them are popular using the popular attribute.", + "target_collection": "TravelDestinations", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationName", + "operator": "LIKE", + "value": "Beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 235, + "database_schema_index": 3, + "natural_language_query": "Find all travel destinations where the destinationDescription contains the keyword 'beach', and group the results by whether or not the destination is popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find all travel destinations where the destinationDescription contains the keyword 'beach', and group the results by whether or not the destination is popular.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "beach" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all travel destinations where the destinationDescription contains the keyword 'beach', and group the results by whether or not the destination is popular.", + "target_collection": "TravelDestinations", + "search_query": "beach", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isPopular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 236, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations with descriptions that contain the keyword 'beaches' in destinationDescription.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations with descriptions that contain the keyword 'beaches' in destinationDescription.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "beaches" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations with descriptions that contain the keyword 'beaches' in destinationDescription.", + "target_collection": "TravelDestinations", + "search_query": "beaches", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "destinationDescription", + "operator": "LIKE", + "value": "%beaches%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 237, + "database_schema_index": 3, + "natural_language_query": "Find the average cost of all travel destinations that are popular, and group the results by each destination name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find the average cost of all travel destinations that are popular, and group the results by each destination name.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the average cost of all travel destinations that are popular, and group the results by each destination name.", + "target_collection": "TravelDestinations", + "search_query": "popular", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "cost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 238, + "database_schema_index": 3, + "natural_language_query": "Find the total sum of packagePrice for all travel packages where discountAvailable is true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find the total sum of packagePrice for all travel packages where discountAvailable is true.", + "target_collection": "TravelPackages", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the total sum of packagePrice for all travel packages where discountAvailable is true.", + "target_collection": "TravelPackages", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "packagePrice", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 239, + "database_schema_index": 3, + "natural_language_query": "List and categorize all popular travel destinations by their names, and for each destination, count the number of detailed descriptions available, ensuring that only destinations currently popular among tourists are included.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "List and categorize all popular travel destinations by their names, and for each destination, count the number of detailed descriptions available, ensuring that only destinations currently popular among tourists are included.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "List and categorize all popular travel destinations by their names, and for each destination, count the number of detailed descriptions available, ensuring that only destinations currently popular among tourists are included.", + "target_collection": "TravelDestinations", + "search_query": "popular among tourists", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10 + }, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.7000000000000001, + "error": null + }, + { + "query_index": 240, + "database_schema_index": 3, + "natural_language_query": "Retrieve destinations with destinationName that are currently popular, then count the number of unique destinationName values.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Retrieve destinations with destinationName that are currently popular, then count the number of unique destinationName values.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 241, + "database_schema_index": 3, + "natural_language_query": "Find me all travel packages where there is a discountAvailable, count how many packages have a discount and organize the results by packageName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find me all travel packages where there is a discountAvailable, count how many packages have a discount and organize the results by packageName.", + "target_collection": "TravelPackages", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "packageName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find me all travel packages where there is a discountAvailable, count how many packages have a discount and organize the results by packageName.", + "target_collection": "TravelPackages", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "discountAvailable", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "packageName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 242, + "database_schema_index": 3, + "natural_language_query": "Find all travel destinations where the destination is currently popular, and calculate the percentage of all travel destinations that are popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find all travel destinations where the destination is currently popular, and calculate the percentage of all travel destinations that are popular.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all travel destinations where the destination is currently popular, and calculate the percentage of all travel destinations that are popular.", + "target_collection": "TravelDestinations", + "search_query": "currently popular", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isPopular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 243, + "database_schema_index": 3, + "natural_language_query": "Find popular travel destinations, where 'popular' equals true, and group results by 'destinationName'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find popular travel destinations, where 'popular' equals true, and group results by 'destinationName'.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find popular travel destinations, where 'popular' equals true, and group results by 'destinationName'.", + "target_collection": "TravelDestinations", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 244, + "database_schema_index": 3, + "natural_language_query": "Find travel destinations that are popular among tourists.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Find travel destinations that are popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "popular", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find travel destinations that are popular among tourists.", + "target_collection": "TravelDestinations", + "search_query": "popular among tourists", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 245, + "database_schema_index": 3, + "natural_language_query": "Count the number of travel agents grouped by their availability status, using the yearsOfExperience property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Count the number of travel agents grouped by their availability status, using the yearsOfExperience property.", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "availableNow" + }, + "predicted_query": { + "corresponding_natural_language_query": "Count the number of travel agents grouped by their availability status, using the yearsOfExperience property.", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isAvailable", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "isAvailable", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 246, + "database_schema_index": 3, + "natural_language_query": "What is the average yearsOfExperience for all travel agents in the TravelAgents collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the average yearsOfExperience for all travel agents in the TravelAgents collection?", + "target_collection": "TravelAgents", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the average yearsOfExperience for all travel agents in the TravelAgents collection?", + "target_collection": "TravelAgents", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "yearsOfExperience", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 247, + "database_schema_index": 3, + "natural_language_query": "What is the count of each travel destination name grouped by whether the destination is popular?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the count of each travel destination name grouped by whether the destination is popular?", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the count of each travel destination name grouped by whether the destination is popular?", + "target_collection": "TravelDestinations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1000000 + }, + "boolean_property_aggregation": null, + "groupby_property": "isPopular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 248, + "database_schema_index": 3, + "natural_language_query": "What is the most common destination name in the Travel Destinations collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "What is the most common destination name in the Travel Destinations collection?", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the most common destination name in the Travel Destinations collection?", + "target_collection": "Travel Destinations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "destinationName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 249, + "database_schema_index": 3, + "natural_language_query": "Show the percentage of popular destinations for each destinationName by grouping the destinations and calculating how many are marked as popular.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Show the percentage of popular destinations for each destinationName by grouping the destinations and calculating how many are marked as popular.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "popular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show the percentage of popular destinations for each destinationName by grouping the destinations and calculating how many are marked as popular.", + "target_collection": "Destinations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isPopular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "destinationName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.0, + "error": null + }, + { + "query_index": 250, + "database_schema_index": 3, + "natural_language_query": "Count how many travel destinations are currently popular and calculate the percentage of popular destinations in the TravelDestinations collection.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Count how many travel destinations are currently popular and calculate the percentage of popular destinations in the TravelDestinations collection.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Count how many travel destinations are currently popular and calculate the percentage of popular destinations in the TravelDestinations collection.", + "target_collection": "TravelDestinations", + "search_query": "currently popular", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "id", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isPopular", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 251, + "database_schema_index": 3, + "natural_language_query": "Group all travel destinations by the boolean property popular and determine the averageVisitCost for each group to understand the cost difference between popular and non-popular destinations.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "TravelDestinations", + "properties": [ + { + "name": "destinationName", + "data_type": [ + "string" + ], + "description": "The name of the travel destination." + }, + { + "name": "destinationDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the destination including attractions, culture, and climate." + }, + { + "name": "averageVisitCost", + "data_type": [ + "number" + ], + "description": "The average cost of a trip to the destination." + }, + { + "name": "popular", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the destination is currently popular among tourists." + } + ], + "envisioned_use_case_overview": "This schema allows users to explore travel destinations based on detailed descriptions and average costs. Semantic search can help users find destinations that match desired experiences or budget levels." + }, + { + "name": "TravelAgents", + "properties": [ + { + "name": "agentName", + "data_type": [ + "string" + ], + "description": "The full name of the travel agent." + }, + { + "name": "agentDescription", + "data_type": [ + "string" + ], + "description": "A detailed description of the agent's expertise, including specialties and customer reviews." + }, + { + "name": "yearsOfExperience", + "data_type": [ + "number" + ], + "description": "The number of years the agent has been in the industry." + }, + { + "name": "availableNow", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the travel agent is currently available for consultation." + } + ], + "envisioned_use_case_overview": "This schema supports customers in finding travel agents based on expertise and availability. Semantic search enables matching with agents who have specific regional knowledge or customer service excellence." + }, + { + "name": "TravelPackages", + "properties": [ + { + "name": "packageName", + "data_type": [ + "string" + ], + "description": "The name of the travel package." + }, + { + "name": "packageDetails", + "data_type": [ + "string" + ], + "description": "A comprehensive description of the travel package, including itinerary and included services." + }, + { + "name": "packagePrice", + "data_type": [ + "number" + ], + "description": "The total price of the travel package." + }, + { + "name": "discountAvailable", + "data_type": [ + "boolean" + ], + "description": "Indicates whether there is a discount available on the package." + } + ], + "envisioned_use_case_overview": "This schema helps travelers find travel packages based on detailed descriptions and pricing. Semantic search allows for discovering packages that align with preferences for activities or budget constraints." + } + ] + }, + "corresponding_natural_language_query": "Group all travel destinations by the boolean property popular and determine the averageVisitCost for each group to understand the cost difference between popular and non-popular destinations.", + "target_collection": "TravelDestinations", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular" + }, + "predicted_query": { + "corresponding_natural_language_query": "Group all travel destinations by the boolean property popular and determine the averageVisitCost for each group to understand the cost difference between popular and non-popular destinations.", + "target_collection": "TravelDestinations", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitCost", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "popular", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 252, + "database_schema_index": 3, + "natural_language_query": "Explore art pieces of significant historical relevance, filter those with a currentValuation greater than 1,000,000, calculate the average currentValuation, and group the results by their onDisplay status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Explore art pieces of significant historical relevance, filter those with a currentValuation greater than 1,000,000, calculate the average currentValuation, and group the results by their onDisplay status.", + "target_collection": "ArtPieces", + "search_query": "Explore art pieces of significant historical relevance", + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "onDisplay" + }, + "predicted_query": { + "corresponding_natural_language_query": "Explore art pieces of significant historical relevance, filter those with a currentValuation greater than 1,000,000, calculate the average currentValuation, and group the results by their onDisplay status.", + "target_collection": "ArtPieces", + "search_query": "significant historical relevance", + "limit": 5, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "onDisplay", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 253, + "database_schema_index": 3, + "natural_language_query": "Find the average currentValuation of art pieces with significant historical details in their artPieceHistory where the currentValuation is greater than 1,000,000.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find the average currentValuation of art pieces with significant historical details in their artPieceHistory where the currentValuation is greater than 1,000,000.", + "target_collection": "ArtPieces", + "search_query": "Explore notable art pieces with historical significance described in their artPieceHistory", + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the average currentValuation of art pieces with significant historical details in their artPieceHistory where the currentValuation is greater than 1,000,000.", + "target_collection": "ArtPieces", + "search_query": "significant historical details in their artPieceHistory", + "limit": 5, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 254, + "database_schema_index": 3, + "natural_language_query": "Explore exhibitions that feature modern art and innovative installations, focusing only on those with an averageVisitorCount above 100, grouped by the exhibitionTitle to identify how many unique exhibitions match this criterion.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Explore exhibitions that feature modern art and innovative installations, focusing only on those with an averageVisitorCount above 100, grouped by the exhibitionTitle to identify how many unique exhibitions match this criterion.", + "target_collection": "Exhibitions", + "search_query": "modern art and innovative installations", + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 255, + "database_schema_index": 3, + "natural_language_query": "Find exhibitions with descriptions about exploring the influence of Impressionism, where the averageVisitorCount is greater than 500, and count unique exhibition titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions with descriptions about exploring the influence of Impressionism, where the averageVisitorCount is greater than 500, and count unique exhibition titles.", + "target_collection": "Exhibitions", + "search_query": "exploring the influence of Impressionism", + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions with descriptions about exploring the influence of Impressionism, where the averageVisitorCount is greater than 500, and count unique exhibition titles.", + "target_collection": "Exhibitions", + "search_query": "exploring the influence of Impressionism", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "title", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1000000 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 256, + "database_schema_index": 4, + "natural_language_query": "Find top museums highlighting Renaissance art, where entry fees are no more than 20, group results by exhibitHighlights, and determine how many are open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find top museums highlighting Renaissance art, where entry fees are no more than 20, group results by exhibitHighlights, and determine how many are open today.", + "target_collection": "Museums", + "search_query": "Top museums highlighting Renaissance art", + "integer_property_filter": { + "property_name": "entryFee", + "operator": "<=", + "value": 20 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitHighlights" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find top museums highlighting Renaissance art, where entry fees are no more than 20, group results by exhibitHighlights, and determine how many are open today.", + "target_collection": "Museums", + "search_query": "Renaissance art", + "limit": 5, + "integer_property_filter": { + "property_name": "entryFee", + "operator": "<=", + "value": 20.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "exhibitHighlights", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 257, + "database_schema_index": 4, + "natural_language_query": "List exhibitions with cultural themes in their exhibitionDescription that have an averageVisitorCount greater than 100, and summarize how many of these exhibitions are currentlyRunning.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "List exhibitions with cultural themes in their exhibitionDescription that have an averageVisitorCount greater than 100, and summarize how many of these exhibitions are currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": "cultural themes", + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "List exhibitions with cultural themes in their exhibitionDescription that have an averageVisitorCount greater than 100, and summarize how many of these exhibitions are currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": "cultural themes in exhibitionDescription", + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 100.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 258, + "database_schema_index": 4, + "natural_language_query": "Find museums where the exhibit highlights emphasize historical significance, filter for museums with entry fees exceeding 10, and group the results by each museum's name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where the exhibit highlights emphasize historical significance, filter for museums with entry fees exceeding 10, and group the results by each museum's name.", + "target_collection": "Museums", + "search_query": "exhibitHighlights", + "integer_property_filter": { + "property_name": "entryFee", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where the exhibit highlights emphasize historical significance, filter for museums with entry fees exceeding 10, and group the results by each museum's name.", + "target_collection": "Museums", + "search_query": "exhibit highlights emphasize historical significance", + "limit": 5, + "integer_property_filter": { + "property_name": "entryFee", + "operator": ">", + "value": 10.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 259, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibitHighlights relevant to 'Impressionist art' that also have an entryFee greater than $10.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibitHighlights relevant to 'Impressionist art' that also have an entryFee greater than $10.", + "target_collection": "Museums", + "search_query": "Impressionist art", + "integer_property_filter": { + "property_name": "entryFee", + "operator": ">", + "value": 10 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibitHighlights relevant to 'Impressionist art' that also have an entryFee greater than $10.", + "target_collection": "Museums", + "search_query": "Impressionist art", + "limit": 5, + "integer_property_filter": { + "property_name": "entryFee", + "operator": ">", + "value": 10.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 260, + "database_schema_index": 4, + "natural_language_query": "Search for art pieces with significant historical relevance using their artPieceHistory, filter for those that have 'Monet' in artPieceName, calculate the average of currentValuation, and group the results by their onDisplay status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Search for art pieces with significant historical relevance using their artPieceHistory, filter for those that have 'Monet' in artPieceName, calculate the average of currentValuation, and group the results by their onDisplay status.", + "target_collection": "ArtPieces", + "search_query": "Find artworks with significant historical relevance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceName", + "operator": "LIKE", + "value": "%Monet%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "onDisplay" + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for art pieces with significant historical relevance using their artPieceHistory, filter for those that have 'Monet' in artPieceName, calculate the average of currentValuation, and group the results by their onDisplay status.", + "target_collection": "ArtPieces", + "search_query": "significant historical relevance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceName", + "operator": "LIKE", + "value": "Monet" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "onDisplay", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 261, + "database_schema_index": 4, + "natural_language_query": "Search for museums whose exhibitHighlights semantically match 'famous art exhibits with rich historical significance', where museumName is exactly 'Louvre', and compute the sum of entryFee.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Search for museums whose exhibitHighlights semantically match 'famous art exhibits with rich historical significance', where museumName is exactly 'Louvre', and compute the sum of entryFee.", + "target_collection": "Museums", + "search_query": "explore famous art exhibits with rich historical significance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "=", + "value": "Louvre" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Search for museums whose exhibitHighlights semantically match 'famous art exhibits with rich historical significance', where museumName is exactly 'Louvre', and compute the sum of entryFee.", + "target_collection": "Museums", + "search_query": "famous art exhibits with rich historical significance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "=", + "value": "Louvre" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 262, + "database_schema_index": 4, + "natural_language_query": "Retrieve museums with exhibit highlights similar to 'ancient artifacts', filter specifically on museums named 'Smithsonian', count the unique exhibit highlights available, and group the results by the museum name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Retrieve museums with exhibit highlights similar to 'ancient artifacts', filter specifically on museums named 'Smithsonian', count the unique exhibit highlights available, and group the results by the museum name.", + "target_collection": "Museums", + "search_query": "Find museums with exhibit highlights similar to 'ancient artifacts'.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "=", + "value": "Smithsonian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve museums with exhibit highlights similar to 'ancient artifacts', filter specifically on museums named 'Smithsonian', count the unique exhibit highlights available, and group the results by the museum name.", + "target_collection": "Museums", + "search_query": "ancient artifacts", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "Smithsonian" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10000 + }, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 263, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions that focus on impressionist themes, check if they are currently running, and count the total number of distinct exhibition titles.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions that focus on impressionist themes, check if they are currently running, and count the total number of distinct exhibition titles.", + "target_collection": "Exhibitions", + "search_query": "Explore exhibitions that focus on impressionist themes in exhibitionDescription", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions that focus on impressionist themes, check if they are currently running, and count the total number of distinct exhibition titles.", + "target_collection": "Exhibitions", + "search_query": "impressionist themes", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "title", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10000 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 264, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibits highlighting the historical significance of Vincent van Gogh's pieces using semantic search, filter for museums whose names include 'National', aggregate by counting the number of museums open today, and group results by museumName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibits highlighting the historical significance of Vincent van Gogh's pieces using semantic search, filter for museums whose names include 'National', aggregate by counting the number of museums open today, and group results by museumName.", + "target_collection": "Museums", + "search_query": "historical significance of Vincent van Gogh's pieces", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "LIKE", + "value": "National" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibits highlighting the historical significance of Vincent van Gogh's pieces using semantic search, filter for museums whose names include 'National', aggregate by counting the number of museums open today, and group results by museumName.", + "target_collection": "Museums", + "search_query": "exhibits highlighting the historical significance of Vincent van Gogh's pieces", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "National" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 265, + "database_schema_index": 4, + "natural_language_query": "Find museums that are most relevant to \"historical importance\" based on exhibitHighlights. Include only those museums where the museumName contains \"Art Gallery\", and show the percentage of these that are openToday.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that are most relevant to \"historical importance\" based on exhibitHighlights. Include only those museums where the museumName contains \"Art Gallery\", and show the percentage of these that are openToday.", + "target_collection": "Museums", + "search_query": "historical importance", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "LIKE", + "value": "Art Gallery" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that are most relevant to \"historical importance\" based on exhibitHighlights. Include only those museums where the museumName contains \"Art Gallery\", and show the percentage of these that are openToday.", + "target_collection": "Museums", + "search_query": "historical importance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "LIKE", + "value": "Art Gallery" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "exhibitHighlights", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 266, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions that are about modern art with innovative displays by looking at the exhibition descriptions. Filter these exhibitions to include only those with 'Masterpiece' in their titles. Then, group the results based on whether the exhibitions are currently running or not.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions that are about modern art with innovative displays by looking at the exhibition descriptions. Filter these exhibitions to include only those with 'Masterpiece' in their titles. Then, group the results based on whether the exhibitions are currently running or not.", + "target_collection": "Exhibitions", + "search_query": "Discover exhibitions about modern art with a focus on innovative displays", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitionTitle", + "operator": "LIKE", + "value": "Masterpiece" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions that are about modern art with innovative displays by looking at the exhibition descriptions. Filter these exhibitions to include only those with 'Masterpiece' in their titles. Then, group the results based on whether the exhibitions are currently running or not.", + "target_collection": "Exhibitions", + "search_query": "modern art with innovative displays", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "title", + "operator": "LIKE", + "value": "Masterpiece" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "isCurrentlyRunning", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 267, + "database_schema_index": 4, + "natural_language_query": "Which museums, including those with names similar to 'Art Museum', have collections described as having significant cultural impact?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Which museums, including those with names similar to 'Art Museum', have collections described as having significant cultural impact?", + "target_collection": "Museums", + "search_query": "The cultural significance of the museum's collection and unique exhibits that attract thousands of visitors.", + "integer_property_filter": null, + "text_property_filter": { + "property_name": "museumName", + "operator": "LIKE", + "value": "*Art Museum*" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Which museums, including those with names similar to 'Art Museum', have collections described as having significant cultural impact?", + "target_collection": "Museums", + "search_query": "collections with significant cultural impact", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "name", + "operator": "LIKE", + "value": "Art Museum" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 268, + "database_schema_index": 4, + "natural_language_query": "What are the museums, grouped by their names, that have exhibit highlights including renaissance art and are open today, along with the sum of their entry fees?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What are the museums, grouped by their names, that have exhibit highlights including renaissance art and are open today, along with the sum of their entry fees?", + "target_collection": "Museums", + "search_query": "exhibitHighlights including 'renaissance art'.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the museums, grouped by their names, that have exhibit highlights including renaissance art and are open today, along with the sum of their entry fees?", + "target_collection": "Museums", + "search_query": "exhibit highlights including renaissance art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 269, + "database_schema_index": 4, + "natural_language_query": "Find currently running exhibitions that explore the theme of Renaissance art and calculate the average visitor count.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find currently running exhibitions that explore the theme of Renaissance art and calculate the average visitor count.", + "target_collection": "Exhibitions", + "search_query": "Explore the theme of Renaissance art.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find currently running exhibitions that explore the theme of Renaissance art and calculate the average visitor count.", + "target_collection": "Exhibitions", + "search_query": "Renaissance art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isCurrentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "visitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9, + "error": null + }, + { + "query_index": 270, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions with thematic content related to 'contemporary art' that are currently running, categorize them by exhibitionTitle, and count the number of occurrences of each exhibitionTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions with thematic content related to 'contemporary art' that are currently running, categorize them by exhibitionTitle, and count the number of occurrences of each exhibitionTitle.", + "target_collection": "Exhibitions", + "search_query": "contemporary art", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions with thematic content related to 'contemporary art' that are currently running, categorize them by exhibitionTitle, and count the number of occurrences of each exhibitionTitle.", + "target_collection": "Exhibitions", + "search_query": "contemporary art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "status", + "operator": "=", + "value": "running" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitionTitle", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1000 + }, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 271, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibits that have historical significance and are open today, and count the number of unique museum names.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibits that have historical significance and are open today, and count the number of unique museum names.", + "target_collection": "Museums", + "search_query": "Search for museums that have exhibits with historical significance in their exhibitHighlights", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibits that have historical significance and are open today, and count the number of unique museum names.", + "target_collection": "Museums", + "search_query": "exhibits with historical significance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "name", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10000 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 272, + "database_schema_index": 4, + "natural_language_query": "Explore museums with notable exhibit highlights that include ancient history artifacts, find which ones are open today, count the total number of museums open today, and segment the results by the museum name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Explore museums with notable exhibit highlights that include ancient history artifacts, find which ones are open today, count the total number of museums open today, and segment the results by the museum name.", + "target_collection": "Museums", + "search_query": "Explore museums with notable exhibitHighlights that include ancient history artifacts", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Explore museums with notable exhibit highlights that include ancient history artifacts, find which ones are open today, count the total number of museums open today, and segment the results by the museum name.", + "target_collection": "Museums", + "search_query": "notable exhibit highlights that include ancient history artifacts", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 273, + "database_schema_index": 4, + "natural_language_query": "Find museums that have notable exhibits with historical significance, indicate if they are open today, and provide the percentage of museums that are indeed open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that have notable exhibits with historical significance, indicate if they are open today, and provide the percentage of museums that are indeed open today.", + "target_collection": "Museums", + "search_query": "exhibitHighlights", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that have notable exhibits with historical significance, indicate if they are open today, and provide the percentage of museums that are indeed open today.", + "target_collection": "Museums", + "search_query": "notable exhibits with historical significance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "openToday", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 274, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibits related to the Renaissance that are open today, and group the results by the museum's name.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibits related to the Renaissance that are open today, and group the results by the museum's name.", + "target_collection": "Museums", + "search_query": "Renaissance exhibits", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibits related to the Renaissance that are open today, and group the results by the museum's name.", + "target_collection": "Museums", + "search_query": "Renaissance exhibits", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 275, + "database_schema_index": 4, + "natural_language_query": "Find museums that highlight Renaissance art exhibits using semantic search on the exhibitHighlights property and filter to only those where openToday is true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that highlight Renaissance art exhibits using semantic search on the exhibitHighlights property and filter to only those where openToday is true.", + "target_collection": "Museums", + "search_query": "Find museums that highlight Renaissance art exhibits", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that highlight Renaissance art exhibits using semantic search on the exhibitHighlights property and filter to only those where openToday is true.", + "target_collection": "Museums", + "search_query": "Renaissance art exhibits", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitHighlights", + "operator": "LIKE", + "value": "Renaissance art exhibits" + }, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 276, + "database_schema_index": 4, + "natural_language_query": "Find museums that have Impressionist art mentioned in their exhibitHighlights, calculate the average entryFee, and group results based on whether they are openToday.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that have Impressionist art mentioned in their exhibitHighlights, calculate the average entryFee, and group results based on whether they are openToday.", + "target_collection": "Museums", + "search_query": "Explore museums showcasing Impressionist art in their exhibitHighlights.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that have Impressionist art mentioned in their exhibitHighlights, calculate the average entryFee, and group results based on whether they are openToday.", + "target_collection": "Museums", + "search_query": "Impressionist art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 277, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions focused on impressionism and calculate the total average visitor count using the averageVisitorCount property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions focused on impressionism and calculate the total average visitor count using the averageVisitorCount property.", + "target_collection": "Exhibitions", + "search_query": "Explore exhibitions focusing on impressionism.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions focused on impressionism and calculate the total average visitor count using the averageVisitorCount property.", + "target_collection": "Exhibitions", + "search_query": "impressionism", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 278, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibits about Renaissance art, categorize the results by their entryFee, and show the 5 most common exhibitHighlights.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibits about Renaissance art, categorize the results by their entryFee, and show the 5 most common exhibitHighlights.", + "target_collection": "Museums", + "search_query": "Search for museums that have exhibits about Renaissance art.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "entryFee" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibits about Renaissance art, categorize the results by their entryFee, and show the 5 most common exhibitHighlights.", + "target_collection": "Museums", + "search_query": "exhibits about Renaissance art", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "entryFee", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 279, + "database_schema_index": 4, + "natural_language_query": "Which museums have the most notable exhibit highlights according to their exhibitHighlights description, and how many distinct museum names are there?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Which museums have the most notable exhibit highlights according to their exhibitHighlights description, and how many distinct museum names are there?", + "target_collection": "Museums", + "search_query": "Find museums with notable exhibits mentioned in exhibitHighlights", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Which museums have the most notable exhibit highlights according to their exhibitHighlights description, and how many distinct museum names are there?", + "target_collection": "Museums", + "search_query": "notable exhibit highlights", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 280, + "database_schema_index": 4, + "natural_language_query": "Identify exhibitions focusing on historical themes, group them by their current status of being open to the public, and compute the percentage of exhibitions that are currently running.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Identify exhibitions focusing on historical themes, group them by their current status of being open to the public, and compute the percentage of exhibitions that are currently running.", + "target_collection": "Exhibitions", + "search_query": "Explore exhibitions with themes of historical significance in their exhibitionDescription.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "currentlyRunning" + }, + "predicted_query": { + "corresponding_natural_language_query": "Identify exhibitions focusing on historical themes, group them by their current status of being open to the public, and compute the percentage of exhibitions that are currently running.", + "target_collection": "Exhibitions", + "search_query": "historical themes", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "isOpen", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "isOpen", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 281, + "database_schema_index": 4, + "natural_language_query": "Find museums with exhibitions related to the Renaissance period and count how many of these museums are open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums with exhibitions related to the Renaissance period and count how many of these museums are open today.", + "target_collection": "Museums", + "search_query": "Discover museums with exhibitions related to the Renaissance period in their exhibitHighlights property.", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums with exhibitions related to the Renaissance period and count how many of these museums are open today.", + "target_collection": "Museums", + "search_query": "exhibitions related to the Renaissance period", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 282, + "database_schema_index": 4, + "natural_language_query": "Find museums where the exhibitHighlights mention ancient artifacts and group the results by whether they are openToday.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where the exhibitHighlights mention ancient artifacts and group the results by whether they are openToday.", + "target_collection": "Museums", + "search_query": "Find museums where exhibitHighlights mention ancient artifacts", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where the exhibitHighlights mention ancient artifacts and group the results by whether they are openToday.", + "target_collection": "Museums", + "search_query": "ancient artifacts", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 283, + "database_schema_index": 4, + "natural_language_query": "What are the museums with exhibit highlights focusing on ancient civilizations?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What are the museums with exhibit highlights focusing on ancient civilizations?", + "target_collection": "Museums", + "search_query": "Find museums with exhibit highlights related to ancient civilizations", + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the museums with exhibit highlights focusing on ancient civilizations?", + "target_collection": "Museums", + "search_query": "exhibit highlights focusing on ancient civilizations", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 284, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions where the averageVisitorCount is at least 100, group them by exhibitionTitle, and compute the mean averageVisitorCount for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is at least 100, group them by exhibitionTitle, and compute the mean averageVisitorCount for each group.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">=", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is at least 100, group them by exhibitionTitle, and compute the mean averageVisitorCount for each group.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">=", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 285, + "database_schema_index": 4, + "natural_language_query": "Find all exhibitions where the averageVisitorCount is greater than 500, and calculate the total sum of averageVisitorCount for these exhibitions.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find all exhibitions where the averageVisitorCount is greater than 500, and calculate the total sum of averageVisitorCount for these exhibitions.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all exhibitions where the averageVisitorCount is greater than 500, and calculate the total sum of averageVisitorCount for these exhibitions.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 500 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 286, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 200, count the number of different exhibition titles, and group the results by whether the exhibition is currentlyRunning.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 200, count the number of different exhibition titles, and group the results by whether the exhibition is currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 200 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 200, count the number of different exhibition titles, and group the results by whether the exhibition is currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 200 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "title", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10000 + }, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 287, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 1000 and count how many unique exhibitionDescription texts there are.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 1000 and count how many unique exhibitionDescription texts there are.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 1000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions where the averageVisitorCount is greater than 1000 and count how many unique exhibitionDescription texts there are.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">", + "value": 1000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitionDescription", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1000000 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 288, + "database_schema_index": 4, + "natural_language_query": "Find museums where the entryFee is 15 or less, aggregate the percentage of museums that are openToday, and group the results by museumName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where the entryFee is 15 or less, aggregate the percentage of museums that are openToday, and group the results by museumName.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": { + "property_name": "entryFee", + "operator": "<=", + "value": 15 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where the entryFee is 15 or less, aggregate the percentage of museums that are openToday, and group the results by museumName.", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "entryFee", + "operator": "<=", + "value": 15.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 289, + "database_schema_index": 4, + "natural_language_query": "Find art pieces from ArtPieces with a currentValuation of at least 1,000,000 and count how many of these are onDisplay.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find art pieces from ArtPieces with a currentValuation of at least 1,000,000 and count how many of these are onDisplay.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">=", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find art pieces from ArtPieces with a currentValuation of at least 1,000,000 and count how many of these are onDisplay.", + "target_collection": "ArtPieces", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">=", + "value": 1000000.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "onDisplay", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 290, + "database_schema_index": 4, + "natural_language_query": "Show exhibitions where the averageVisitorCount is greater than or equal to 100, and group the results by the currentlyRunning status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Show exhibitions where the averageVisitorCount is greater than or equal to 100, and group the results by the currentlyRunning status.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">=", + "value": 100 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show exhibitions where the averageVisitorCount is greater than or equal to 100, and group the results by the currentlyRunning status.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "averageVisitorCount", + "operator": ">=", + "value": 100.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 291, + "database_schema_index": 4, + "natural_language_query": "Find art pieces with a currentValuation greater than 1,000,000.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find art pieces with a currentValuation greater than 1,000,000.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find art pieces with a currentValuation greater than 1,000,000.", + "target_collection": "ArtPieces", + "search_query": null, + "limit": 5, + "integer_property_filter": { + "property_name": "currentValuation", + "operator": ">", + "value": 1000000.0 + }, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 292, + "database_schema_index": 4, + "natural_language_query": "For museums that are currently open, calculate the average entry fee grouped by the name of the museum.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "For museums that are currently open, calculate the average entry fee grouped by the name of the museum.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": "true" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "For museums that are currently open, calculate the average entry fee grouped by the name of the museum.", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openNow", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 293, + "database_schema_index": 4, + "natural_language_query": "Find the average currentValuation of all art pieces in the ArtPieces collection whose artPieceHistory contains the word 'Renaissance'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find the average currentValuation of all art pieces in the ArtPieces collection whose artPieceHistory contains the word 'Renaissance'.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceHistory", + "operator": "LIKE", + "value": "Renaissance" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find the average currentValuation of all art pieces in the ArtPieces collection whose artPieceHistory contains the word 'Renaissance'.", + "target_collection": "ArtPieces", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceHistory", + "operator": "LIKE", + "value": "%Renaissance%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 294, + "database_schema_index": 4, + "natural_language_query": "Count the number of unique museums with exhibitHighlights containing 'historical significance' and group these counts by whether or not the museum is open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Count the number of unique museums with exhibitHighlights containing 'historical significance' and group these counts by whether or not the museum is open today.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitHighlights", + "operator": "LIKE", + "value": "historical significance" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday" + }, + "predicted_query": { + "corresponding_natural_language_query": "Count the number of unique museums with exhibitHighlights containing 'historical significance' and group these counts by whether or not the museum is open today.", + "target_collection": "Museums", + "search_query": "exhibitHighlights containing 'historical significance'", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitHighlights", + "operator": "LIKE", + "value": "%historical significance%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 295, + "database_schema_index": 4, + "natural_language_query": "Find art pieces where \"Monet\" is mentioned in artPieceHistory, and count the number of unique artPieceName values.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find art pieces where \"Monet\" is mentioned in artPieceHistory, and count the number of unique artPieceName values.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceHistory", + "operator": "LIKE", + "value": "Monet" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find art pieces where \"Monet\" is mentioned in artPieceHistory, and count the number of unique artPieceName values.", + "target_collection": "ArtPieces", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceHistory", + "operator": "LIKE", + "value": "Monet" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "artPieceName", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10000 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 296, + "database_schema_index": 4, + "natural_language_query": "Find museums where exhibitHighlights contain the keyword 'ancient artifacts', calculate what percentage of these museums are openToday, and group the museums by entryFee to see the distribution across different price categories.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where exhibitHighlights contain the keyword 'ancient artifacts', calculate what percentage of these museums are openToday, and group the museums by entryFee to see the distribution across different price categories.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitHighlights", + "operator": "LIKE", + "value": "ancient artifacts" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "entryFee" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where exhibitHighlights contain the keyword 'ancient artifacts', calculate what percentage of these museums are openToday, and group the museums by entryFee to see the distribution across different price categories.", + "target_collection": "Museums", + "search_query": "ancient artifacts", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "entryFee", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 297, + "database_schema_index": 4, + "natural_language_query": "Find museums that mention 'renaissance' in their exhibitHighlights and count how many of them are open today.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums that mention 'renaissance' in their exhibitHighlights and count how many of them are open today.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitHighlights", + "operator": "LIKE", + "value": "renaissance" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums that mention 'renaissance' in their exhibitHighlights and count how many of them are open today.", + "target_collection": "Museums", + "search_query": "renaissance", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitHighlights", + "operator": "LIKE", + "value": "renaissance" + }, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 298, + "database_schema_index": 4, + "natural_language_query": "Find exhibitions where the exhibitionTitle contains 'Impressionism' and group the results by currentlyRunning status.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find exhibitions where the exhibitionTitle contains 'Impressionism' and group the results by currentlyRunning status.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitionTitle", + "operator": "LIKE", + "value": "Impressionism" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find exhibitions where the exhibitionTitle contains 'Impressionism' and group the results by currentlyRunning status.", + "target_collection": "Exhibitions", + "search_query": "Impressionism", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "exhibitionTitle", + "operator": "LIKE", + "value": "%Impressionism%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "currentlyRunning", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 299, + "database_schema_index": 4, + "natural_language_query": "Find art pieces where the artPieceName contains the word 'Starry'.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find art pieces where the artPieceName contains the word 'Starry'.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceName", + "operator": "LIKE", + "value": "%Starry%" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find art pieces where the artPieceName contains the word 'Starry'.", + "target_collection": "ArtPieces", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": { + "property_name": "artPieceName", + "operator": "LIKE", + "value": "Starry" + }, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8, + "error": null + }, + { + "query_index": 300, + "database_schema_index": 4, + "natural_language_query": "Find a summary of the total averageVisitorCount for each exhibitionTitle where the exhibition is currentlyRunning.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find a summary of the total averageVisitorCount for each exhibitionTitle where the exhibition is currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find a summary of the total averageVisitorCount for each exhibitionTitle where the exhibition is currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 301, + "database_schema_index": 4, + "natural_language_query": "Find all art pieces that are on display and calculate the total current valuation of these pieces using the `onDisplay` property for filtering and `currentValuation` property for aggregation.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find all art pieces that are on display and calculate the total current valuation of these pieces using the `onDisplay` property for filtering and `currentValuation` property for aggregation.", + "target_collection": "ArtPieces", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "onDisplay", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find all art pieces that are on display and calculate the total current valuation of these pieces using the `onDisplay` property for filtering and `currentValuation` property for aggregation.", + "target_collection": "ArtPieces", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "onDisplay", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "currentValuation", + "metrics": "SUM" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 302, + "database_schema_index": 4, + "natural_language_query": "Retrieve a list of all museums that are open today, group them by the museumName, and within each group, count the occurrence of each unique exhibitHighlights.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Retrieve a list of all museums that are open today, group them by the museumName, and within each group, count the occurrence of each unique exhibitHighlights.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Retrieve a list of all museums that are open today, group them by the museumName, and within each group, count the occurrence of each unique exhibitHighlights.", + "target_collection": "Museums", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 1000 + }, + "boolean_property_aggregation": null, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 303, + "database_schema_index": 4, + "natural_language_query": "Find museums in the Museums collection that are open today (using the 'openToday' boolean property filter), and determine the most common exhibit highlights among them (using text property aggregation on 'exhibitHighlights').", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums in the Museums collection that are open today (using the 'openToday' boolean property filter), and determine the most common exhibit highlights among them (using text property aggregation on 'exhibitHighlights').", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": null + }, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums in the Museums collection that are open today (using the 'openToday' boolean property filter), and determine the most common exhibit highlights among them (using text property aggregation on 'exhibitHighlights').", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 10 + }, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 304, + "database_schema_index": 4, + "natural_language_query": "Show the percentage of exhibitions on 'exhibitionTitle' that are currently running. Group the results by exhibitionTitle to determine which specific exhibitions have the highest visitor count while currentlyRunning.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Show the percentage of exhibitions on 'exhibitionTitle' that are currently running. Group the results by exhibitionTitle to determine which specific exhibitions have the highest visitor count while currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": { + "corresponding_natural_language_query": "Show the percentage of exhibitions on 'exhibitionTitle' that are currently running. Group the results by exhibitionTitle to determine which specific exhibitions have the highest visitor count while currentlyRunning.", + "target_collection": "Exhibitions", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "visitorCount", + "metrics": "MAX" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "currentlyRunning", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": "exhibitionTitle", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 305, + "database_schema_index": 4, + "natural_language_query": "Count how many exhibitions are currently open to the public and find those that are open.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Count how many exhibitions are currently open to the public and find those that are open.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "currentlyRunning", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Count how many exhibitions are currently open to the public and find those that are open.", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "isOpen", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.9500000000000001, + "error": null + }, + { + "query_index": 306, + "database_schema_index": 4, + "natural_language_query": "List all museums that are open today and group them by their entry fee.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "List all museums that are open today and group them by their entry fee.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "entryFee" + }, + "predicted_query": { + "corresponding_natural_language_query": "List all museums that are open today and group them by their entry fee.", + "target_collection": "Museums", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "entryFee", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 307, + "database_schema_index": 4, + "natural_language_query": "Find museums where the openToday flag is set to true.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find museums where the openToday flag is set to true.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Find museums where the openToday flag is set to true.", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 308, + "database_schema_index": 4, + "natural_language_query": "For each unique exhibitionTitle, determine the count of exhibitions that are currently running by aggregating over the currentlyRunning property and grouping the results by exhibitionTitle.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "For each unique exhibitionTitle, determine the count of exhibitions that are currently running by aggregating over the currentlyRunning property and grouping the results by exhibitionTitle.", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "exhibitionTitle" + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "2 validation errors for IntAggregation\nproperty_name\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing\nmetrics\n Field required [type=missing, input_value={}, input_type=dict]\n For further information visit https://errors.pydantic.dev/2.10/v/missing" + }, + { + "query_index": 309, + "database_schema_index": 4, + "natural_language_query": "What is the mean of the averageVisitorCount in the Exhibitions collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What is the mean of the averageVisitorCount in the Exhibitions collection?", + "target_collection": "Exhibitions", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "What is the mean of the averageVisitorCount in the Exhibitions collection?", + "target_collection": "Exhibitions", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": { + "property_name": "averageVisitorCount", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 310, + "database_schema_index": 4, + "natural_language_query": "What are the top 5 most common exhibit highlights in terms of descriptions for museums, grouped by each museum's name?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What are the top 5 most common exhibit highlights in terms of descriptions for museums, grouped by each museum's name?", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "exhibitHighlights", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "What are the top 5 most common exhibit highlights in terms of descriptions for museums, grouped by each museum's name?", + "target_collection": "Museums", + "search_query": "exhibit highlights", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": { + "property_name": "description", + "metrics": "TOP_OCCURRENCES", + "top_occurrences_limit": 5 + }, + "boolean_property_aggregation": null, + "groupby_property": "name", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.65, + "error": null + }, + { + "query_index": 311, + "database_schema_index": 4, + "natural_language_query": "What is the count of unique museum names in the Museums collection?", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "What is the count of unique museum names in the Museums collection?", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": null + }, + "predicted_query": null, + "tool_rationale": "", + "ast_score": 0.0, + "error": "1 validation error for IntAggregation\nmetrics\n Input should be 'MIN', 'MAX', 'MEAN', 'MEDIAN', 'MODE' or 'SUM' [type=literal_error, input_value='COUNT', input_type=str]\n For further information visit https://errors.pydantic.dev/2.10/v/literal_error" + }, + { + "query_index": 312, + "database_schema_index": 4, + "natural_language_query": "Find out how many museums are open today and group this information by museumName.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Find out how many museums are open today and group this information by museumName.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "TOTAL_TRUE" + }, + "groupby_property": "museumName" + }, + "predicted_query": { + "corresponding_natural_language_query": "Find out how many museums are open today and group this information by museumName.", + "target_collection": "Museums", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "museumName", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + }, + { + "query_index": 313, + "database_schema_index": 4, + "natural_language_query": "Calculate the percentage of museums that are open today based on the openToday property.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Calculate the percentage of museums that are open today based on the openToday property.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null + }, + "predicted_query": { + "corresponding_natural_language_query": "Calculate the percentage of museums that are open today based on the openToday property.", + "target_collection": "Museums", + "search_query": null, + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": { + "property_name": "openToday", + "metrics": "PERCENTAGE_TRUE" + }, + "groupby_property": null, + "total_count": null + }, + "tool_rationale": "", + "ast_score": 1.0, + "error": null + }, + { + "query_index": 314, + "database_schema_index": 4, + "natural_language_query": "Organize museums based on whether they are open today and calculate the average entry fee for each group.", + "ground_truth_query": { + "database_schema": { + "weaviate_collections": [ + { + "name": "Museums", + "properties": [ + { + "name": "museumName", + "data_type": [ + "string" + ], + "description": "The name of the museum." + }, + { + "name": "exhibitHighlights", + "data_type": [ + "string" + ], + "description": "A detailed description of the museum's most notable exhibits and their historical significance." + }, + { + "name": "entryFee", + "data_type": [ + "number" + ], + "description": "The standard entry fee for the museum." + }, + { + "name": "openToday", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the museum is open today." + } + ], + "envisioned_use_case_overview": "The Museums schema provides an enriching database for those interested in exploring detailed cultural exhibits. Semantic search capabilities highlight unique features and historical value of the museum's collections." + }, + { + "name": "Exhibitions", + "properties": [ + { + "name": "exhibitionTitle", + "data_type": [ + "string" + ], + "description": "The title of the exhibition." + }, + { + "name": "exhibitionDescription", + "data_type": [ + "string" + ], + "description": "A comprehensive overview of the exhibition, including themes and featured artworks." + }, + { + "name": "averageVisitorCount", + "data_type": [ + "number" + ], + "description": "The average number of visitors per day for the exhibition." + }, + { + "name": "currentlyRunning", + "data_type": [ + "boolean" + ], + "description": "Indicates whether the exhibition is currently open to the public." + } + ], + "envisioned_use_case_overview": "This schema helps users discover and explore various exhibitions based on thematic interest or visitor popularity, encouraging semantic searches for immersive cultural experiences." + }, + { + "name": "ArtPieces", + "properties": [ + { + "name": "artPieceName", + "data_type": [ + "string" + ], + "description": "The name of the art piece." + }, + { + "name": "artPieceHistory", + "data_type": [ + "string" + ], + "description": "A detailed history and description of the art piece, including the artist and creation story." + }, + { + "name": "currentValuation", + "data_type": [ + "number" + ], + "description": "The current market valuation of the art piece." + }, + { + "name": "onDisplay", + "data_type": [ + "boolean" + ], + "description": "A flag indicating if the art piece is currently on display." + } + ], + "envisioned_use_case_overview": "The ArtPieces schema supports the discovery and assessment of art pieces across various museums. With semantic capabilities, users can explore artwork based on historical significance and monetary valuation." + } + ] + }, + "corresponding_natural_language_query": "Organize museums based on whether they are open today and calculate the average entry fee for each group.", + "target_collection": "Museums", + "search_query": null, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": null, + "integer_property_aggregation": null, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday" + }, + "predicted_query": { + "corresponding_natural_language_query": "Organize museums based on whether they are open today and calculate the average entry fee for each group.", + "target_collection": "Museums", + "search_query": "", + "limit": 5, + "integer_property_filter": null, + "text_property_filter": null, + "boolean_property_filter": { + "property_name": "openToday", + "operator": "=", + "value": true + }, + "integer_property_aggregation": { + "property_name": "entryFee", + "metrics": "MEAN" + }, + "text_property_aggregation": null, + "boolean_property_aggregation": null, + "groupby_property": "openToday", + "total_count": null + }, + "tool_rationale": "", + "ast_score": 0.8500000000000001, + "error": null + } + ] +} \ No newline at end of file diff --git a/src/test_gorilla/main_test.py b/src/test_gorilla/main_test.py index 71e3433..db96a62 100644 --- a/src/test_gorilla/main_test.py +++ b/src/test_gorilla/main_test.py @@ -123,7 +123,7 @@ def run(self): """Execute the experiment workflow.""" print(f"\033[92m=== Starting {self.config.experiment_type.title()} Experiment ===\033[0m") - queries = load_queries("../../data/synthetic-weaviate-queries-with-results.json") + queries = load_queries("../../data/updated-queries-with-schemas.json") detailed_results = [] per_schema_scores = {} successful_predictions = failed_predictions = 0 @@ -142,7 +142,7 @@ def run(self): # Update metrics self.total_queries += 1 self.total_ast_score += result.ast_score - if result.ast_score == 1.0: + if result.ast_score >= 0.95: self.perfect_matches += 1 # Print current metrics avg_ast = self.total_ast_score / self.total_queries @@ -162,8 +162,12 @@ def run(self): def _build_query_from_args(self, args: Dict, nl_query: str) -> WeaviateQuery: """Constructs a WeaviateQuery from tool call arguments.""" + collection_name = args["collection_name"] + if collection_name: + collection_name = collection_name[0].upper() + collection_name[1:] + return WeaviateQuery( - target_collection=args["collection_name"], + target_collection=collection_name, search_query=args.get("search_query"), integer_property_filter=self._create_model_instance(IntPropertyFilter, args.get("integer_property_filter")), text_property_filter=self._create_model_instance(TextPropertyFilter, args.get("text_property_filter")), @@ -210,12 +214,63 @@ def _process_single_query(self, idx: int, query: WeaviateQueryWithSchema) -> Que try: collections_description, collections_enum = get_collections_info(self.db_manager.client) tools = self.build_tools(collections_description, collections_enum) - + + prompt = f""" +You are a precision-focused Weaviate query generator. Your ONLY task is to output a final Weaviate query that EXACTLY matches the provided schema and NL query. Every element (collection names, property names, filter types, operators, numeric formats, aggregation metrics, and group-by properties) must be an exact match. No substitutions, derivations, or extra text is allowed. Do not reveal any internal reasoning. + +Instructions: +1. Analyze the Schema & NL Query: + • Use ONLY schema values for collection and property names (e.g., "Restaurants", "averageRating"). + • Extract the descriptive search query exactly from the NL query. + • For filters: + - Text: use Text Filter with LIKE. + - Numeric: use Integer Filter with operators (=, <, >, <=, >=) and numeric values (include .0 if required). + - Boolean: use Boolean Filter with "=" and value True. + • For aggregations, use: + - Text: TOP_OCCURRENCES. + - Numeric: MIN, MAX, MEAN, MEDIAN, MODE, or SUM. + - Boolean: TOTAL_TRUE, TOTAL_FALSE, PERCENTAGE_TRUE, or PERCENTAGE_FALSE. + • If counting objects is needed, set total_count to true (do NOT use COUNT in aggregations). + • Group By must exactly match a schema property. + +2. Verification (Internal Only): + • Confirm every element exactly matches the schema—no extra filters or modifications. + +3. Output Format (Output ONLY): +Weaviate Query Details: + Target Collection: + Search Query: + Total Count: + [Filters if any:] + • Filter Type: + • Property: + • Operator: + • Value: + [Aggregations if any:] + • Aggregation Type: + • Property: + • Metrics: + Group By: + Natural Language Query: {nl_query} + +User Query: +{nl_query} + +Available Schema (Collections and Properties): +{collections_description} + +Now, generate the final Weaviate query following these guidelines. +IMPORTANT!! Please remember, COUNT and TYPE are not valid aggregations for an IntAggregation, TextAggregation, or BooleanAggregation! +IMPORTANT!! Please remember to format your response as a function call with the arguments you have chosen. +""" + response = self.lm_service.one_step_function_selection_test( - prompt=nl_query, + prompt=prompt, tools=tools, parallel_tool_calls=self.config.parallel_tool_calls ) + print("HERE") + print(response) predicted_query = self._process_tool_response(response, nl_query) @@ -244,6 +299,8 @@ def _process_single_query(self, idx: int, query: WeaviateQueryWithSchema) -> Que ) except Exception as e: + print(e) + print(f"\033[96m{response}\033[0m") return self._create_error_result(idx, schema_idx, nl_query, query, str(e)) def _create_error_result(self, idx: int, schema_idx: int, nl_query: str, @@ -410,9 +467,9 @@ def create_experiment(config: ExperimentConfig) -> BaseExperiment: if __name__ == "__main__": # Example usage of the unified framework config = ExperimentConfig( - model_provider="together", - model_name="meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo", - api_key=os.getenv("TOGETHER_API_KEY"), + model_provider="openai", + model_name="gpt-4o", + api_key=os.getenv("OPENAI_API_KEY"), experiment_type="standard", generate_with_models=False ) diff --git a/src/utils/weaviate_fc_utils.py b/src/utils/weaviate_fc_utils.py index 7a91e1d..0993d04 100644 --- a/src/utils/weaviate_fc_utils.py +++ b/src/utils/weaviate_fc_utils.py @@ -101,7 +101,7 @@ def build_weaviate_query_tool_for_openai(collections_description: str, collectio "description": "Aggregate numeric properties using statistical functions", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "MIN", "MAX", "MEAN", "MEDIAN", "MODE", "SUM"]} + "metrics": {"type": "string", "enum": ["MIN", "MAX", "MEAN", "MEDIAN", "MODE", "SUM"]} } }, "text_property_aggregation": { @@ -109,7 +109,7 @@ def build_weaviate_query_tool_for_openai(collections_description: str, collectio "description": "Aggregate text properties using frequency analysis", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "TOP_OCCURRENCES"]}, + "metrics": {"type": "string", "enum": ["TOP_OCCURRENCES"]}, "top_occurrences_limit": {"type": "integer"} } }, @@ -118,7 +118,7 @@ def build_weaviate_query_tool_for_openai(collections_description: str, collectio "description": "Aggregate boolean properties using statistical functions", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "TOTAL_TRUE", "TOTAL_FALSE", "PERCENTAGE_TRUE", "PERCENTAGE_FALSE"]} + "metrics": {"type": "string", "enum": ["TOTAL_TRUE", "TOTAL_FALSE", "PERCENTAGE_TRUE", "PERCENTAGE_FALSE"]} } }, "groupby_property": { @@ -186,7 +186,7 @@ def build_weaviate_query_tool_for_anthropic(collections_description: str, collec "description": "Aggregate numeric properties using statistical functions", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "MIN", "MAX", "MEAN", "MEDIAN", "MODE", "SUM"]} + "metrics": {"type": "string", "enum": ["MIN", "MAX", "MEAN", "MEDIAN", "MODE", "SUM"]} } }, "text_property_aggregation": { @@ -194,7 +194,7 @@ def build_weaviate_query_tool_for_anthropic(collections_description: str, collec "description": "Aggregate text properties using frequency analysis", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "TOP_OCCURRENCES"]}, + "metrics": {"type": "string", "enum": ["TOP_OCCURRENCES"]}, "top_occurrences_limit": {"type": "integer"} } }, @@ -203,7 +203,7 @@ def build_weaviate_query_tool_for_anthropic(collections_description: str, collec "description": "Aggregate boolean properties using statistical functions", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "TOTAL_TRUE", "TOTAL_FALSE", "PERCENTAGE_TRUE", "PERCENTAGE_FALSE"]} + "metrics": {"type": "string", "enum": ["TOTAL_TRUE", "TOTAL_FALSE", "PERCENTAGE_TRUE", "PERCENTAGE_FALSE"]} } }, "groupby_property": { @@ -267,7 +267,7 @@ def build_weaviate_query_tool_for_ollama(collections_description: str, collectio "type": "object", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "MIN", "MAX", "MEAN", "MEDIAN", "MODE", "SUM"]} + "metrics": {"type": "string", "enum": ["MIN", "MAX", "MEAN", "MEDIAN", "MODE", "SUM"]} }, "required": ["property_name", "metrics"] }, @@ -275,7 +275,7 @@ def build_weaviate_query_tool_for_ollama(collections_description: str, collectio "type": "object", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "TOP_OCCURRENCES"]}, + "metrics": {"type": "string", "enum": ["TOP_OCCURRENCES"]}, "top_occurrences_limit": {"type": "integer"} }, "required": ["property_name", "metrics"] @@ -284,7 +284,7 @@ def build_weaviate_query_tool_for_ollama(collections_description: str, collectio "type": "object", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "TOTAL_TRUE", "TOTAL_FALSE", "PERCENTAGE_TRUE", "PERCENTAGE_FALSE"]} + "metrics": {"type": "string", "enum": ["TOTAL_TRUE", "TOTAL_FALSE", "PERCENTAGE_TRUE", "PERCENTAGE_FALSE"]} }, "required": ["property_name", "metrics"] }, @@ -350,7 +350,7 @@ def build_weaviate_query_tool_for_cohere(collections_description: str, collectio "description": "Aggregate numeric properties using statistical functions", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "MIN", "MAX", "MEAN", "MEDIAN", "MODE", "SUM"]} + "metrics": {"type": "string", "enum": ["MIN", "MAX", "MEAN", "MEDIAN", "MODE", "SUM"]} } }, "text_property_aggregation": { @@ -358,7 +358,7 @@ def build_weaviate_query_tool_for_cohere(collections_description: str, collectio "description": "Aggregate text properties using frequency analysis", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "TOP_OCCURRENCES"]}, + "metrics": {"type": "string", "enum": ["TOP_OCCURRENCES"]}, "top_occurrences_limit": {"type": "integer"} } }, @@ -367,7 +367,7 @@ def build_weaviate_query_tool_for_cohere(collections_description: str, collectio "description": "Aggregate boolean properties using statistical functions", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "TOTAL_TRUE", "TOTAL_FALSE", "PERCENTAGE_TRUE", "PERCENTAGE_FALSE"]} + "metrics": {"type": "string", "enum": ["TOTAL_TRUE", "TOTAL_FALSE", "PERCENTAGE_TRUE", "PERCENTAGE_FALSE"]} } }, "groupby_property": { @@ -435,7 +435,7 @@ def build_weaviate_query_tool_for_together(collections_description: str, collect "description": "Aggregate numeric properties using statistical functions", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "MIN", "MAX", "MEAN", "MEDIAN", "MODE", "SUM"]} + "metrics": {"type": "string", "enum": ["MIN", "MAX", "MEAN", "MEDIAN", "MODE", "SUM"]} } }, "text_property_aggregation": { @@ -443,7 +443,7 @@ def build_weaviate_query_tool_for_together(collections_description: str, collect "description": "Aggregate text properties using frequency analysis", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "TOP_OCCURRENCES"]}, + "metrics": {"type": "string", "enum": ["TOP_OCCURRENCES"]}, "top_occurrences_limit": {"type": "integer"} } }, @@ -452,7 +452,7 @@ def build_weaviate_query_tool_for_together(collections_description: str, collect "description": "Aggregate boolean properties using statistical functions", "properties": { "property_name": {"type": "string"}, - "metrics": {"type": "string", "enum": ["COUNT", "TYPE", "TOTAL_TRUE", "TOTAL_FALSE", "PERCENTAGE_TRUE", "PERCENTAGE_FALSE"]} + "metrics": {"type": "string", "enum": ["TOTAL_TRUE", "TOTAL_FALSE", "PERCENTAGE_TRUE", "PERCENTAGE_FALSE"]} } }, "groupby_property": {