tdoehmen's picture
added duckdb-nsql benchmark setup
b247dc4
raw
history blame
27.5 kB
[
{
"db_id": "hn",
"query": "SELECT COUNT(*) as domain_count, \nSUBSTRING(SPLIT_PART(url, '//', 2), 1, POSITION('/' IN SPLIT_PART(url, '//', 2)) - 1) as domain \nFROM hacker_news\nWHERE url IS NOT NULL GROUP BY domain ORDER BY domain_count DESC LIMIT 10;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "what are the top domains being shared on hacker_news?",
"category": "hard"
},
{
"db_id": "laptop",
"query": "SELECT c.firstname, c.lastname, COUNT(*) AS num_pcs_bought\nFROM customers c\nJOIN sales s ON c.customer_id = s.customer_id\nJOIN pcs p ON s.model = p.model\nGROUP BY c.customer_id, c.firstname, c.lastname\nORDER BY num_pcs_bought DESC\nLIMIT 1;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Who bought the most PCs, print also the users name?",
"category": "medium"
},
{
"db_id": "transactions",
"query": "select users.id, users.name, sum(transactions.amount) as balance from users join transactions on users.id = transactions.user_id group by users.id, users.name having balance = 0",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "list the names off account holders who have negative balances",
"category": "easy"
},
{
"db_id": "laptop",
"query": "SELECT model FROM products WHERE maker = 'B';",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "List only the model number of all products made by maker B.",
"category": "easy"
},
{
"db_id": "laptop",
"query": "SELECT model FROM products WHERE maker <> 'B';",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "List the model numbers of all products not made by maker B.",
"category": "easy"
},
{
"db_id": "laptop",
"query": "SELECT AVG(speed) FROM pcs WHERE speed >= 3.00",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Return the average speed all PCs with speed >= 3.00",
"category": "easy"
},
{
"db_id": "laptop",
"query": "SELECT MAX(price) FROM printers WHERE color = 'TRUE' AND type='laser'",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Return the price of the most expensive color laser printer",
"category": "medium"
},
{
"db_id": "laptop",
"query": "SELECT MIN(paid) FROM sales WHERE type_of_payment LIKE '%visa%'",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Return the minimum amount paid by customers who used a visa card (debit or credit) to purchase a product",
"category": "medium"
},
{
"db_id": "laptop",
"query": "SELECT customer_id FROM customers WHERE firstname LIKE '%e%' OR lastname LIKE '%e%'",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Find the customer_id of customers who have the letter 'e' either in their first name or in their last name",
"category": "medium"
},
{
"db_id": "laptop",
"query": "SELECT model, price/0.85 AS 'price (USD)' FROM laptops WHERE ram >= 1024",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Assume all prices in the table Laptops are in Euro. List the prices of laptops with at least 1024 ram. You should return the price in USD in a column called 'price (USD)'. Assume that 1 USD = 0.85 EURO. Name the price column 'price (USD)'.",
"category": "hard"
},
{
"db_id": "laptop",
"query": "SELECT maker FROM products GROUP BY maker HAVING COUNT(maker) > 4;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Return a list of makers that make more than four different products.",
"category": "medium"
},
{
"db_id": "laptop",
"query": "SELECT model FROM laptops WHERE speed > 1.7 ORDER BY speed DESC;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "List all the laptop model numbers that have a speed greater than 1.7 in descending order of speed.",
"category": "medium"
},
{
"db_id": "laptop",
"query": "SELECT firstname \n FROM sales \n JOIN customers ON sales.customer_id = customers.customer_id \n GROUP BY firstname \n ORDER BY COUNT(firstname);",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "List firstnames of customers in an ascending order based on the number of purchases made by customers with this firstname.",
"category": "medium"
},
{
"db_id": "laptop",
"query": "SELECT DISTINCT maker FROM products JOIN pcs ON products.model = pcs.model WHERE ram > 1500;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "List all the makers (with only one entry per maker) who make PCs with RAM greater than 1500.",
"category": "medium"
},
{
"db_id": "laptop",
"query": "SELECT city, AVG(paid) as 'avg_spend' FROM sales JOIN customers ON sales.customer_id = customers.customer_id GROUP BY city",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Find the city and the average amount of money spent by customers in each city. Name the column for the amount 'avg_spend'",
"category": "medium"
},
{
"db_id": "laptop",
"query": "SELECT color, MAX(price) as 'max_price' FROM printers GROUP BY color;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Find the maximum price for each color of printer. Name the column for the maximum price 'max_price'",
"category": "medium"
},
{
"db_id": "who",
"query": "select country_name, max(pm25_concentration) as worst_pm25_for_country\nfrom ambient_air_quality\ngroup by country_name\norder by worst_pm25_for_country desc\nlimit 1",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Find the country with the worst single reading of air quality (highest PM 2.5 value). Show the PM 2.5 value as well.",
"category": "medium"
},
{
"db_id": "who",
"query": "select country_name, avg(pm25_concentration) as worst_avg_pm25_for_country\nfrom ambient_air_quality\ngroup by country_name\norder by worst_avg_pm25_for_country desc\nlimit 1",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Find the country with the worst average air quality (highest PM 2.5 value). Show the PM 2.5 value as well.",
"category": "medium"
},
{
"db_id": "who",
"query": "select distinct country_name from ambient_air_quality order by country_name",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Find all countries for which WHO air quality data is available. Sort alphabetically.",
"category": "medium"
},
{
"db_id": "who",
"query": "select year, avg(pm25_concentration) from ambient_air_quality \nwhere country_name = 'Singapore'\ngroup by year\norder by year",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Find Singapore air quality defined as PM2.5 concentration over time",
"category": "medium"
},
{
"db_id": "nyc",
"query": "SELECT COLUMNS('^trip_') FROM rideshare LIMIT 10;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "select only the column names from the rideshare table that start with trip_ and return the first 10 values",
"category": "duckdb"
},
{
"db_id": "nyc",
"query": "SELECT * FROM rideshare USING SAMPLE 1%;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "select a 1% sample from the nyc.rideshare table",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT * EXCLUDE (customer_id) FROM customers;\n",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "select all columns from the customer table, except customer_id",
"category": "duckdb"
},
{
"db_id": "nyc",
"query": "SUMMARIZE rideshare;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "show summary statistics of the rideshare table",
"category": "duckdb"
},
{
"db_id": "none",
"query": "SELECT * FROM read_csv_auto(\n'https://raw.githubusercontent.com/datasciencedojo/datasets/master/titanic.csv')",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "read a CSV from https://raw.githubusercontent.com/datasciencedojo/datasets/master/titanic.csv",
"category": "duckdb"
},
{
"db_id": "none",
"query": "COPY (SELECT * FROM read_csv_auto(\n'https://raw.githubusercontent.com/datasciencedojo/datasets/master/titanic.csv'))\nTO 'titanic.parquet' (FORMAT 'parquet');",
"setup_sql": ";",
"validation_sql": "SELECT * FROM 'titanic.parquet'",
"question": "read a CSV from https://raw.githubusercontent.com/datasciencedojo/datasets/master/titanic.csv and convert it to a parquet file called \"titanic\"",
"category": "duckdb"
},
{
"db_id": "none",
"query": "CREATE TABLE titanic AS (SELECT * FROM read_csv_auto(\n'https://raw.githubusercontent.com/datasciencedojo/datasets/master/titanic.csv'))",
"setup_sql": ";",
"validation_sql": "SELECT * FROM titanic;",
"question": "create a table called \"titanic\" from CSV file https://raw.githubusercontent.com/datasciencedojo/datasets/master/titanic.csv",
"category": "duckdb"
},
{
"db_id": "none",
"query": "PRAGMA default_null_order='NULLS LAST';",
"setup_sql": ";",
"validation_sql": "SELECT current_setting('default_null_order');",
"question": "configure duckdb to put null values last when sorting",
"category": "duckdb"
},
{
"db_id": "none",
"query": "CREATE TABLE IF NOT EXISTS products (\n maker varchar(10),\n model varchar(10),\n type varchar(10));",
"setup_sql": ";",
"validation_sql": "SELECT * FROM products;",
"question": "create a table about products, that contains a maker, model and type column",
"category": "ddl"
},
{
"db_id": "product",
"query": "INSERT INTO products (maker, model, type)\nVALUES\n ('A', '1001', 'pc');",
"setup_sql": ";",
"validation_sql": "SELECT * FROM products;",
"question": "add a row with values for model \"1001\" of type \"pc\", from maker \"A\" to products table",
"category": "ddl"
},
{
"db_id": "none",
"query": "CALL pragma_version();\n",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "get current version of duckdb",
"category": "duckdb"
},
{
"db_id": "nyc",
"query": "PRAGMA table_info('rideshare');",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "list all columns in table nyc.rideshare",
"category": "duckdb"
},
{
"db_id": "nyc",
"query": "PRAGMA show_tables;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "show all tables in the curent database",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT customer_id, model, sum(paid) FROM sales GROUP BY ALL",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "how much did each customer spend per model type?",
"category": "easy"
},
{
"db_id": "nyc",
"query": "SELECT Max(datediff('minute', tpep_pickup_datetime, tpep_dropoff_datetime)) from nyc.taxi",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "What was the longest taxi ride in minutes?",
"category": "hard"
},
{
"db_id": "who",
"query": "with per_region as (\n select avg(pm10_concentration) as avg_pm10, who_region from ambient_air_quality group by who_region\n), max_region as (\n select who_region from per_region where avg_pm10 = (select max(avg_pm10) from per_region)\n), min_city_value_in_max_region as (\n select min(pm10_concentration) from ambient_air_quality where who_region in (from max_region)\n), min_city_in_max_region as (\n select city from ambient_air_quality where pm10_concentration in (from min_city_value_in_max_region) and who_region in (from max_region)\n)\nfrom min_city_in_max_region",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "What is the city with the lowest pm10 concentration in the region with the highest average pm10 concentration?",
"category": "hard"
},
{
"db_id": "hn",
"query": "SELECT *, regexp_extract(text, '([a-z0-9_\\.-]+)@([\\da-z\\.-]+)\\.([a-z\\.]{2,63})',0) email from hacker_news where email[:4]='test'",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Get all posts on hn that contain an email address starting with test. Return all original columns, plus a new column containing the email address.",
"category": "hard"
},
{
"db_id": "json",
"query": "SELECT employee.id, employee.first_name FROM employee_json",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Extract id and first_name properties as individual columns from the employee struct",
"category": "duckdb"
},
{
"db_id": "who",
"query": "SELECT who_region[1]::INT as region, * EXCLUDE (who_region) FROM who.ambient_air_quality",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "count quality measurements per region. Make sure to return the region code (first char of who_region) as integer and sort by region.",
"category": "duckdb"
},
{
"db_id": "flightinfo",
"query": "SELECT seat.seat_number FROM seat \nJOIN direct_flight ON direct_flight.flight_number = seat.flight_number \nJOIN airport AS departure_airport ON departure_airport.iata_code = direct_flight.departure_airport_iata_code \nJOIN airport AS arriving_airport ON arriving_airport.iata_code = direct_flight.arriving_airport_iata_code \nJOIN city AS departure_city ON departure_city.city_zipcode = departure_airport.city_zip_code \nJOIN city AS arriving_city ON arriving_city.city_zipcode = arriving_airport.city_zip_code \nWHERE departure_city.city_name = 'Bruxelles' AND arriving_city.city_name = 'Newark';",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "Which seats were available on the flight from Bruxelles to Newark?",
"category": "hard"
},
{
"db_id": "laptop",
"query": "COPY customers FROM 'customers_12_12_2023.csv';",
"setup_sql": "COPY customers TO 'customers_12_12_2023.csv';",
"validation_sql": "SELECT * FROM customers;",
"question": "copy content of csv file customers_12_12_2023.csv into customers table",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "COPY customers FROM 'customers_12_12_2023.csv' (DELIMITER '\\t');",
"setup_sql": "COPY customers TO 'customers_12_12_2023.csv' (FORMAT CSV, DELIMITER '\\t');",
"validation_sql": "SELECT * FROM customers;",
"question": "copy content of csv file costomers_12_12_2023.csv into customers table with tab separator",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "COPY customers FROM 'customers_partitioned/city=Amsterdam/*.parquet';",
"setup_sql": "COPY customers TO 'customers_partitioned' (FORMAT PARQUET, PARTITION_BY (city), OVERWRITE_OR_IGNORE True);",
"validation_sql": "SELECT * FROM customers;;",
"question": "copy any parquet files from 'customers_partitioned/city=Amsterdam/' into customers table",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "COPY customers(customer_id) FROM 'customers_customer_ids.csv';",
"setup_sql": "COPY customers(customer_id) TO 'customers_customer_ids.csv';",
"validation_sql": "SELECT * FROM customers;",
"question": "copy only the customer_id column from the customers_customer_ids.csv into the customers tables",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "CREATE TABLE test_tbl AS SELECT * FROM read_json_auto('test.json');",
"setup_sql": "COPY customers TO 'test.json'\n",
"validation_sql": "SELECT * FROM test_tbl;",
"question": "read json file from test.json and create new table from it called 'test_tbl'",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT * FROM read_csv_auto('test.csv');",
"setup_sql": "COPY customers TO 'test.csv';",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "read csv from test.csv",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT * FROM read_csv_auto('test.csv', columns={'customer_id': 'VARCHAR', 'firstname': 'VARCHAR', 'lastname': 'VARCHAR'});",
"setup_sql": "COPY customers(customer_id, firstname, lastname) TO 'test.csv';",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "read csv from test.csv with predefined column and types - customer_id: string, firstname: string, lastname: string",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT * EXCLUDE (ram, hd) FROM pcs;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "select all columns from pcs table except for ram and hd",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT COLUMNS('name$') FROM customers;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "select all columns ending with 'name' from customers table",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT LENGTH(COLUMNS('name$')) FROM customers",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "for each column ending with 'name' in the customers table, compute the string length",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT * REPLACE (upper(city) AS city) FROM customers;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "get all columns from customer table, and make all city names uppercase",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "EXPLAIN SELECT * FROM customers",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "show query plan for query: SELECT * from customers",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT ascii(lastname) FROM customers;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "get the first character of the firstname column and cast it to an INT",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT model, speed::INTEGER FROM laptops;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "get laptop name and speed, return the speed as integer",
"category": "duckdb"
},
{
"db_id": "laptop_array",
"query": "SELECT phone_numbers[1] FROM customers;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "get the first phone number of each customer",
"category": "duckdb"
},
{
"db_id": "laptop_array",
"query": "INSERT INTO customers(customer_id, phone_numbers) VALUES (5, ['12312323', '23123344']);",
"setup_sql": ";",
"validation_sql": "SELECT * FROM customers;",
"question": "insert two phone numbers to customer with id 5 [\\\"12312323\\\", and '23123344']",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "ALTER TABLE customers ADD COLUMN phone_numbers VARCHAR[];",
"setup_sql": ";",
"validation_sql": "DESCRIBE customers;",
"question": "how to add a new column phone_numbers to the customers table, with array type varchar",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT firstname[1] FROM customers;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "get the first letter of the customers firstname",
"category": "duckdb"
},
{
"db_id": "laptop_array",
"query": "SELECT phone_numbers[:2] FROM customers;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "get the first two phone numbers from the phone numbers array of each customer",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT {'a':1, 'b':2, 'c':3};",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "create a struct with keys a, b, c and values 1,2,3",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT [1,2,3];\n",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "create array with values 1,2,3",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "CREATE TABLE test (embeddings FLOAT[100]);",
"setup_sql": ";",
"validation_sql": "DESCRIBE test;",
"question": "create table test with a fix-sized array column with 100 dimenions, called embeddings",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "CREATE TABLE test (person STRUCT(name VARCHAR, id INTEGER));",
"setup_sql": ";",
"validation_sql": "DESCRIBE test;",
"question": "create table test with a struct column called person with properties name and id",
"category": "duckdb"
},
{
"db_id": "laptop_struct",
"query": "SELECT person.name, person.id FROM test;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "get persons name and persons id from the test table.",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "UPDATE customers SET email = NULL;",
"setup_sql": ";",
"validation_sql": "SELECT email FROM customers;",
"question": "remove all values from email column in customers table",
"category": "duckdb"
},
{
"db_id": "laptop_json",
"query": "ALTER TABLE customers ALTER COLUMN email SET DATA TYPE VARCHAR;",
"setup_sql": ";",
"validation_sql": "DESCRIBE customers;",
"question": "make customer email of type VARCHAR",
"category": "duckdb"
},
{
"db_id": "laptop_json",
"query": "INSERT INTO customers (customer_id, email) VALUES (5,'{\"from\": \"[email protected]\", \"to\": \"[email protected]\"}');",
"setup_sql": ";",
"validation_sql": "SELECT * FROM customers;",
"question": "insert json into customer email for customer id 5: {'from': '[email protected]', 'to': '[email protected]'}",
"category": "duckdb"
},
{
"db_id": "laptop_json",
"query": "SELECT customers.email->>'from' FROM customers;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "get 'from' field from customer email json",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SUMMARIZE customers;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "summarize the customer table",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT * FROM customers USING SAMPLE 10% (reservoir);",
"setup_sql": ";",
"validation_sql": "SELECT count(*) FROM ddb_benchmark_result;",
"question": "sample 10% from the customers table using reservoir sampling",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SET threads = 10;",
"setup_sql": ";",
"validation_sql": "SELECT current_setting('threads');",
"question": "set number of threads to 10",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SET memory_limit = '20G';\n",
"setup_sql": ";",
"validation_sql": "SELECT current_setting('memory_limit');",
"question": "set memory limit to 20 gigabyte",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT * EXCLUDE (price), avg(price) FROM laptops GROUP BY ALL;",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "show the average price of laptop and group by the remaining columns",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "SELECT * FROM laptops WHERE price > 1000 ORDER BY ALL;\n",
"setup_sql": ";",
"validation_sql": "SELECT * FROM ddb_benchmark_result;",
"question": "show all laptops with price above 1000 and order by all columns",
"category": "duckdb"
},
{
"db_id": "laptop",
"query": "ATTACH 'who.ddb';",
"setup_sql": ";",
"validation_sql": "SHOW DATABASES;",
"question": "attach database file who.ddb",
"category": "duckdb"
}
]