turso

mirror of https://github.com/aljazceru/turso.git synced 2026-01-11 12:14:21 +01:00

Author	SHA1	Message	Date
joao.faria	2ba643cd68	fix: prevent DROP TABLE when table is referenced by foreign keys Add foreign key constraint check in translate_drop_table to reject dropping tables that are referenced by foreign keys when PRAGMA foreign_keys=ON	2025-11-04 12:32:19 -03:00
Pekka Enberg	2bf5eb84cf	Merge 'Prevent misuse of subqueries that return multiple columns' from Jussi Saurio Closes #3892 Closes #3888 Stuff like: ```sql turso> create table t1(x); create table t2(y, z); insert into t1 values (1); insert into t2 values (1, 2); select case (select y, z from t2) when 1 then 'one' else 'other' end from t1; × Parse error: base expression in CASE must return 1 value turso> create table t(x, y); insert into t values (1, 2); select (select x, y from t) as result; × Parse error: result column must return 1 value, got 2 turso> create table t1(x,y); create table t2(y); insert into t1 values (1,1); insert into t2 values (1); select * from t2 where y = (select x,y from t1); × Parse error: all arguments to binary operator = must return the same number of │ values. Got: (1) = (2) turso> create table orders(customer_id, amount); create table thresholds(min_amount, max_amount); insert into orders values (100, 50), (100, 150); insert into thresholds values (100, 200); select customer_id, sum(amount) as total from orders group by customer_id having total > (select min_amount, max_amount from thresholds); × Parse error: all arguments to binary operator > must return the same number of │ values. 
Got: (1) > (2) turso> create table items(id); create table config(max_results, other_col); insert into items values (1), (2), (3); insert into config values (2, 3); select * from items limit (select max_results, other_col from config); × Parse error: limit expression must return 1 value, got 2 turso> create table items(id); create table config(skip_count, other_col); insert into items values (1), (2), (3); insert into config values (1, 2); select * from items limit 1 offset (select skip_count, other_col from config); × Parse error: offset expression must return 1 value, got 2 turso> create table items(id, name); create table sort_order(priority, other_col); insert into items values (1, 'a'), (2, 'b'); insert into sort_order values (1, 2); select * from items order by (select priority, other_col from sort_order); × Parse error: order by expression must return 1 value, got 2 turso> create table sales(product_id, amount); create table grouping(category, other_col); insert into sales values (1, 100), (2, 200); insert into grouping values (1, 2); select sum(amount) from sales group by (select category, other_col from grouping); × Parse error: group by expression must return 1 value, got 2 turso> create table t1(x); create table t2(y, z); insert into t1 values (1); insert into t2 values (1, 2); select case when (select y, z from t2) then 'yes' else 'no' end from t1; × Parse error: when expression in CASE must return 1 value. Got: (2) turso> create table t1(x); create table t2(y, z); insert into t1 values (1); insert into t2 values (1, 2); select case when x = 1 then (select y, z from t2) else 0 end from t1; × Parse error: then expression in CASE must return 1 value. Got: (2) turso> create table t1(x); create table t2(y, z); insert into t1 values (1); insert into t2 values (1, 2); select case when x = 2 then 0 else (select y, z from t2) end from t1; × Parse error: else expression in CASE must return 1 value. 
Got: (2) turso> create table t1(x); create table t2(y, z); insert into t1 values (1); insert into t2 values (1, 2); select max((select y, z from t2)) from t1; × Parse error: argument 0 to function call max must return 1 value. Got: (2) turso> create table t1(x); create table t2(y, z); insert into t1 values (1); insert into t2 values (1, 2); select x + (select y, z from t2) from t1; × Parse error: all arguments to binary operator + must return the same number of │ values. Got: (1) + (2) turso> create table t1(x); create table t2(y, z); insert into t1 values (5); insert into t2 values (1, 2); select * from t1 where x between (select y, z from t2) and 10; × Parse error: all arguments to binary operator <= must return the same number of │ values. Got: (2) <= (1) turso> create table t1(x); create table t2(y, z); insert into t1 values (1); insert into t2 values (1, 2); select cast((select y, z from t2) as integer) from t1; × Parse error: argument to CAST must return 1 value. Got: (2) turso> create table t1(x); create table t2(y, z); insert into t1 values (1); insert into t2 values ('a', 'b'); select (select y, z from t2) collate nocase from t1; × Parse error: argument to COLLATE must return 1 value. Got: (2) turso> create table t1(x); create table t2(y, z); insert into t1 values (1); insert into t2 values (1, 2); select * from t1 where (select y, z from t2) is null; × Parse error: all arguments to binary operator IS must return the same number of │ values. Got: (2) IS (1) turso> create table t1(x); create table t2(y, z); insert into t1 values (1); insert into t2 values (1, 2); select * from t1 where (select y, z from t2) not null; × Parse error: argument to NOT NULL must return 1 value. Got: (2) turso> create table t1(x); create table t2(y, z); insert into t1 values (1); insert into t2 values ('a', 'b'); select * from t1 where (select y, z from t2) like 'a%'; × Parse error: left operand of LIKE must return 1 value. 
Got: (2) turso> create table t1(x); create table t2(y, z); insert into t1 values (1); insert into t2 values (1, 2); select -(select y, z from t2) from t1; × Parse error: argument to unary operator - must return 1 value. Got: (2) turso> create table t1(x); create table t2(y, z); insert into t1 values (1); insert into t2 values (1, 2); select abs((select y, z from t2)) from t1; × Parse error: argument 0 to function call abs must return 1 value. Got: (2) ``` Closes #3906	2025-11-03 13:06:38 +02:00
Pekka Enberg	9aae220509	Merge 'Optimize and refactor schema::Column type' from Preston Thorpe closes https://github.com/tursodatabase/turso/issues/3773 ## Before ```rust #[derive(Debug, Clone)] pub struct Column { pub name: Option<String>, pub ty: Type, // many sqlite operations like table_info retain the original string pub ty_str: String, pub primary_key: bool, pub is_rowid_alias: bool, pub notnull: bool, pub default: Option<Box<Expr>>, pub unique: bool, pub collation: Option<CollationSeq>, pub hidden: bool, } ``` obviously not ideal. so lets pack `type`, `hidden`, `primary_key`, `is_rowid_alias`, `notnull` and `collation` into a u16. ## After: ```rust #[derive(Debug, Clone)] pub struct Column { pub name: Option<String>, pub ty_str: String, pub default: Option<Box<Expr>>, raw: u16, } ``` Also saw a place to replace a `Mutex<Enum>` with `AtomicEnum`, so I snuck that in here too Reviewed-by: Jussi Saurio <jussi.saurio@gmail.com> Closes #3905	2025-11-03 13:05:35 +02:00
Jussi Saurio	1c2a8e62ca	Fix: return error on provided insert column count mismatch	2025-11-03 11:41:50 +02:00
Jussi Saurio	005d922ab4	Fix: prevent misuse of subqueries that return multiple columns	2025-11-03 11:04:09 +02:00
PThorpe92	481d86f567	Optimize and refactor schema::Column type	2025-11-02 20:46:02 -05:00
Pekka Enberg	72edc6d758	Merge 'Clean up Connection::from_uri() by using DatabaseOpts' from Rohith Suresh Fixes #3900 Migrating the `from_uri` function to use `DatabaseOpts` Reviewed-by: Preston Thorpe <preston@turso.tech> Closes #3901	2025-11-02 16:55:44 +02:00
pedrocarlo	28c52cdf09	pass the left select in compound select to correctly choose the collation sequence	2025-11-02 11:26:48 -03:00
RS2007	60cbc6d8ea	migrating from_uri to database opts	2025-11-02 16:28:22 +05:30
Pekka Enberg	913b7ac600	core: Disable autovacuum by default People have discovered various bugs in autovacuum so let's disable it by default for now.	2025-11-02 12:09:21 +02:00
PThorpe92	23496f0bea	Fix incorrect unreachable precondition for affinity char in op_seek_rowid	2025-11-01 20:43:44 -04:00
Pekka Enberg	c091f94de8	Merge 'Fix INSERT UNION ALL' from Duy Dang Close #3849 Close #3855 Reviewed-by: Jussi Saurio <jussi.saurio@gmail.com> Closes #3877	2025-11-01 11:12:38 +02:00
Pekka Enberg	7283f35a29	Merge 'Fix LEFT JOIN subqueries reusing stale right-side values' from Duy Dang Close #3867 Reviewed-by: Jussi Saurio <jussi.saurio@gmail.com> Closes #3874	2025-11-01 11:12:24 +02:00
Duy Dang	e0f6b7cffe	Fix INSERT handling for compound VALUES sources	2025-11-01 02:27:42 +07:00
Duy Dang	4b18e3bab5	Fix VALUES UNION ALL register reuse during INSERTs	2025-11-01 02:01:30 +07:00
Duy Dang	3ee47a2c3c	Fix LEFT JOIN subqueries reusing stale right-side values	2025-11-01 01:24:31 +07:00
RS2007	7fff8daaa5	Fixing clippy error	2025-10-31 23:14:08 +05:30
RS2007	1f576593ec	adding duplicate cte name checks in planner.rs	2025-10-31 23:14:08 +05:30
Duy Dang	733dc762ed	Fix self-insert SUM when table uses INTEGER PRIMARY KEY	2025-10-31 03:34:10 +07:00
Pekka Enberg	eaff2d135f	Merge 'Fix database state going back in time after sync' from Nikita Sivukhin This PR fixes a sync engine bug which leads to the state of the db going back in time. The mistake was made in the pull operation, which previously fetched information about the last committed changes to the remote separately. This creates a problem since pull already works with fixed WAL updates received earlier from the remote - and this WAL update can be inconsistent with a fresher value of last_change_id fetched from the remote. The fix is to use only the WAL update and "extract" the necessary information from it. In order to do that, sync now reads the meta sync table while the pull operation is in progress (at the moment when local changes are rolled back and remote changes are already applied) and does not use any external source to obtain that information. Also, this PR fixes a bug in the JS tursodatabase client and resets the statement in the finally block, as opposed to the previous approach of resetting the statement at the beginning. The problem with the previous approach was in cases where the client does not fully consume the statement (e.g. aborts iteration and takes only one row), in which case the statement is kept active and can prevent another write transaction from starting or just occupy a slot as a read transaction. Closes #3860	2025-10-29 17:53:45 +02:00
Jussi Saurio	6cf2072b51	translate: disallow correlated subqueries in HAVING and ORDER BY These are supported by SQLite, but we cannot handle them correctly yet.	2025-10-29 15:37:19 +02:00
Nikita Sivukhin	4c98861590	adjust logs	2025-10-29 16:24:05 +04:00
Jussi Saurio	96990e1168	Merge 'Stmt reset cursors' from Nikita Sivukhin This PR resets cursor state in the `stmt.reset()` method because under the hood the statement caches some BTree state which may no longer be valid at the time of the next statement run. Reviewed-by: Preston Thorpe <preston@turso.tech> Closes #3859	2025-10-29 14:04:52 +02:00
Nikita Sivukhin	a2d11f9263	reset cursors when statement is reset	2025-10-29 15:13:00 +04:00
Nikita Sivukhin	9629e2f26a	reset move_to_right_state cached state in case of quick balancing	2025-10-29 14:58:42 +04:00
Jussi Saurio	4bf8ad8cfd	Merge 'Support subqueries in all positions of a SELECT statement' from Jussi Saurio Follow-up to #3847. Adds support for subqueries in all other positions of a SELECT (the result list, GROUP BY, ORDER BY, HAVING, LIMIT, OFFSET). Turns out I am a sql noob and didn't realize that correlated subqueries are supported in basically all positions except LIMIT/OFFSET, so added support for those too + accompanying TCL tests. Thankfully the abstractions introduced in #3847 carry over to this very well so the code change is relatively small (over half of the diff is tests and a lot of the remaining diff is just moving logic around). Reviewed-by: Preston Thorpe <preston@turso.tech> Closes #3852	2025-10-29 10:19:39 +02:00
Jussi Saurio	fcb927ed24	Merge 'Initialize LIMIT after ORDER BY / GROUP BY initialization' from Jussi Saurio Closes #3853 Currently LIMIT 0 jumps to "after the main loop", and it is done before ORDER BY and GROUP BY cursors have had a chance to be initialized, which causes a panic. Simplest fix for now is to delay the LIMIT initialization. Reviewed-by: Preston Thorpe <preston@turso.tech> Closes #3854	2025-10-29 10:17:05 +02:00
Jussi Saurio	29fe3b585a	Add more tests and disable correlated IN-subqueries in HAVING position I discovered a flaw in our current translation that makes queries of type HAVING foo IN (SELECT ...) not work properly - in these cases we need to defer translation of the subquery until later. I will fix this in a future PR because I suspect it's not trivial.	2025-10-29 09:57:55 +02:00
Jussi Saurio	ad723b615f	Merge 'index_method: fully integrate into query planner' from Nikita Sivukhin This PR completely integrates custom indices into the query planner. In order to do that, a new `Cursor::IndexMethod` is introduced along with a few related changes in the VM implementation: 1. Added special `IndexMethod{Create,Destroy,Query}` opcodes to handle index method creation, deletion and query 2. `Next`, `IdxRowid`, `IdxInsert`, `IdxDelete` opcodes updated to properly handle the new cursor case Reviewed-by: Jussi Saurio <jussi.saurio@gmail.com> Closes #3827	2025-10-29 09:42:37 +02:00
Pekka Enberg	dae2930743	Merge 'core: Switch to FxHash to improve performance' from Pekka Enberg The default Rust hash map is slow for integer keys. Switch to FxHash instead to reduce executed instructions for, for example, throughput benchmark. Before: ``` penberg@turing:~/src/tursodatabase/turso/perf/throughput/turso$ perf stat ../../../target/release/write-throughput --threads 1 --batch-size 100 --compute 0 -i 10000 Turso,1,100,0,106875.21 Performance counter stats for '../../../target/release/write-throughput --threads 1 --batch-size 100 --compute 0 -i 10000': 2,908.02 msec task-clock # 0.310 CPUs utilized 30,508 context-switches # 10.491 K/sec 261 cpu-migrations # 89.752 /sec 813 page-faults # 279.572 /sec 20,655,313,128 instructions # 1.73 insn per cycle # 0.14 stalled cycles per insn 11,930,088,949 cycles # 4.102 GHz 2,845,040,381 stalled-cycles-frontend # 23.85% frontend cycles idle 3,814,652,892 branches # 1.312 G/sec 54,760,600 branch-misses # 1.44% of all branches 9.372979876 seconds time elapsed 2.276835000 seconds user 0.530135000 seconds sys ``` After: ``` penberg@turing:~/src/tursodatabase/turso/perf/throughput/turso$ perf stat ../../../target/release/write-throughput --threads 1 --batch-size 100 --compute 0 -i 10000 Turso,1,100,0,108663.84 Performance counter stats for '../../../target/release/write-throughput --threads 1 --batch-size 100 --compute 0 -i 10000': 2,838.65 msec task-clock # 0.308 CPUs utilized 30,629 context-switches # 10.790 K/sec 351 cpu-migrations # 123.650 /sec 818 page-faults # 288.165 /sec 19,887,102,451 instructions # 1.72 insn per cycle # 0.14 stalled cycles per insn 11,593,166,024 cycles # 4.084 GHz 2,830,298,617 stalled-cycles-frontend # 24.41% frontend cycles idle 3,764,334,333 branches # 1.326 G/sec 53,157,766 branch-misses # 1.41% of all branches 9.218225731 seconds time elapsed 2.231889000 seconds user 0.508785000 seconds sys ``` Closes #3837	2025-10-28 14:49:09 +02:00
Pekka Enberg	810ed8ad60	Merge 'Don't allow autovacuum to be flipped on non-empty databases' from Pavan Nambi Turso incorrectly creates the first table in an autovacuumed table in page 2. (Note: this is on collaboration with @LeMikaelF) SQLite does not allow enabling or disabling auto-vacuum after the first table has been created (https://sqlite.org/pragma.html#pragma_auto_vacuum). This is because the sequence of the pages in the databases is different when auto-vacuum is enabled, because the first b-tree page must be page 3 instead of 2, to make room for the first [Pointer Map page](https://sqlite.org/fileformat.html#pointer_map_or_ptrmap_pages). But Turso doesn't currently consider this, which can lead to data loss. The simplest way to reproduce this is to create an autovacuumed databases with either `pragma auto_vacuum=full` so that autovacuum runs on each commit, and then create a table with some data. Turso will incorrectly create the new table on page 2. After this, every time a new page is created, either through a page split or because a new table is created, Turso will write a 5-byte pointer in page 2, starting from the top of the page, thereby overwriting existing data. For example, let's start with a clean database and the first bytes of page 2. It starts with `0d`, the discriminator for a leaf page ([source](https://www.sqlite.org/fileformat.html#b_tree_pages)). The next interesting number is the number of cells contained in this page (`01`) at offset 5. ``` $ cargo run -- /tmp/a.db turso> create table t(a); turso> insert into t values ('myvalue'); $ dbtotxt /tmp/a.db \| size 8192 pagesize 4096 filename a.db \| page 1 offset 0 # ...snip... \| page 2 offset 4096 \| 0: 0d 00 00 00 01 0f f5 00 0f f5 00 00 00 00 00 00 ................ 
\| 4080: 00 00 00 00 00 09 01 02 1b 6d 79 76 61 6c 75 65 .........myvalue \| end a.db ``` Pointer map pages are located every N pages, starting from page 2, and contain a list of 5-byte pointers that represent the parent page of a certain page. So whenever Turso or SQLite needs to add a page, it will overwrite 5 bytes of page 2. This means that for data loss to occur, it is sufficient to add a single page to the database, for example by creating a table. Offset 5 will then be zeroed out: ``` $ cargo run -- /tmp/a.db turso> create table t(a); turso> insert into t values ('myvalue'); turso> pragma auto_vacuum=full; turso> create table tt(a); $ dbtotxt /tmp/a.db \| size 12288 pagesize 4096 filename a.db \| page 1 offset 0 # ...snip... \| page 2 offset 4096 \| 0: 01 00 00 00 00 0f f5 00 0f f5 00 00 00 00 00 00 ................ \| 4080: 00 00 00 00 00 09 01 02 1b 6d 79 76 61 6c 75 65 .........myvalue ``` Creating more tables, or adding more B-tree pages, will keep overwriting the rest of the page, until the cells themselves are also overwritten. ## Reproducing the issue in the simulator We have been unable to reproduce this exact corruption mode in the simulator, but patching it shows many failure modes, all of which don't occur with the unpatched simulator. The following seeds are failing. The following seeds are showing the issue when the patched simulator is ran against `main`: - `11522841279124073062`, with "Assertion 'table inquisitive_graham_159 should contain all of its expected values' failed: table inquisitive_graham_159 does not contain the expected values, the simulator model has more rows than the database" - `7057400018220918989`, `16028085350691325843`, `7721542713659053944`, and `203017821863546118`, with "Failed to read ptrmap key=XXX" - `12533694709304969540`, `18357088553315413457`, `3108945730906932377`, with "Integrity Check Failed: Cell N in page 2 is out of range." 
- `4757352625344646473`, with "dirty pages should be empty for read txn" - `7083498604824302257`, with "header_size: 6272, header_len_bytes: 2, payload.len(): 13" - `17881876827470741581`, with "ParseError("no such table: focused_historians_416")" - `2092231500503735693`, with "range end index 4789 out of range for slice of length 4096" - `7555257419378470845`, with "malformed database schema (imaginative_ontivero\u{1})" - `12905270229511147245`, with "index out of bounds: the len is 4096 but the index is 4096" ## Fixing the issue - When DB is opened, we read the `auto_vacuum` state, instead of assuming `auto_vacuum=none`. - Don't allow auto_vacuum to be flipped on non-empty databases, because allowing this could cause overlap with existing bits (ptrmap could overwrite existing data). - Modify integrity check to avoid reporting that page 2 is orphaned in auto-vacuumed databases. Fixes #3752 Closes #3830	2025-10-28 14:48:35 +02:00
Jussi Saurio	4e48e1ffad	Make an exception for Expr::SubqueryResult in collect_result_columns()	2025-10-28 13:11:12 +02:00
Jussi Saurio	c80cf2831d	Support subqueries in all positions of a SELECT statement	2025-10-28 13:11:12 +02:00
Jussi Saurio	49ee5529cb	Evaluate uncorrelated subqueries as early as possible even LIMIT can reference an uncorrelated subquery, so we need to translate them before we do anything with LIMIT.	2025-10-28 13:11:11 +02:00
Jussi Saurio	3294b78051	Initialize LIMIT after ORDER BY / GROUP BY initialization Currently LIMIT 0 jumps to "after the main loop", and it is done before ORDER BY and GROUP BY cursors have had a chance to be initialized, which causes a panic. Simplest fix for now is to delay the LIMIT initialization.	2025-10-28 13:08:05 +02:00
Nikita Sivukhin	0da3b4bfd3	fix after rebase	2025-10-28 11:27:35 +04:00
Nikita Sivukhin	bec295f2c0	fix clippy	2025-10-28 11:27:35 +04:00
Nikita Sivukhin	8ea733f917	fix bug with cursor allocation	2025-10-28 11:27:35 +04:00
Nikita Sivukhin	8acbe3de66	make query_start method return a bool indicating whether the result will have any rows	2025-10-28 11:27:35 +04:00
Nikita Sivukhin	e42ce24534	fix fmt	2025-10-28 11:27:35 +04:00
Nikita Sivukhin	67c1855ba8	fix bug	2025-10-28 11:27:35 +04:00
Nikita Sivukhin	6206294584	fix clippy	2025-10-28 11:27:35 +04:00
Nikita Sivukhin	180713d32a	plug IndexMethod into optimizer	2025-10-28 11:27:35 +04:00
Nikita Sivukhin	d6972a9cf3	fix explain	2025-10-28 11:27:35 +04:00
Nikita Sivukhin	56796151bc	support necessary helpers	2025-10-28 11:27:35 +04:00
Nikita Sivukhin	212bcfe08f	integrate IndexMethod into select main loop	2025-10-28 11:27:35 +04:00
Nikita Sivukhin	61c9279a57	properly translate column which was covered by index method	2025-10-28 11:27:35 +04:00
Nikita Sivukhin	d9ea3be4b8	forbid usage of IndexMethod in insert/delete loops	2025-10-28 11:27:35 +04:00
Nikita Sivukhin	d65b7eddc0	add helper for simple binding of values in the AST	2025-10-28 11:27:35 +04:00
Nikita Sivukhin	35b96ae8d8	fix a few places which need to be hooked into new types	2025-10-28 11:27:35 +04:00

1 2 3 4 5 ...

5974 Commits