Skip to content

Commit 0e54131

Browse files
authored
Tokenizer (#92)
1 parent 59bf008 commit 0e54131

24 files changed

+626
-76
lines changed

.gitignore

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -5,3 +5,4 @@ data/sort_by_*
55
data/sorted_by_*
66
src/rust/target/
77
__pycache__/
8+
**/.mypy_cache/

data/sql_input_2.sql

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,8 +14,9 @@ VALUES ('San Francisco', 852469, -8);
1414
INSERT INTO city (name, population, timezone)
1515
VALUES ('New York', 8405837, -5);
1616

17-
SELECT
17+
SELECT (
1818
name,
1919
population,
2020
timezone
21+
)
2122
FROM city;

data/sql_input_3.sql

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,8 +14,9 @@ VALUES ('San Francisco', -8);
1414
INSERT INTO city (name, population)
1515
VALUES ('New York', 8405837);
1616

17-
SELECT
17+
SELECT (
1818
name,
1919
population,
2020
timezone
21+
)
2122
FROM city;

data/tokenizer_input_0.sql

Lines changed: 22 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,22 @@
1+
CREATE TABLE town ();
2+
3+
CREATE TABLE city (
4+
name VARCHAR,
5+
population INT,
6+
timezone INT
7+
);
8+
9+
INSERT INTO city (name, population, timezone)
10+
VALUES ('San Francisco', 852469, -8);
11+
12+
INSERT INTO city (name, population)
13+
VALUES ('New York', 8405837);
14+
15+
SELECT (
16+
name,
17+
population,
18+
timezone
19+
)
20+
FROM city;
21+
22+
SELECT name FROM city;

data/tokenizer_input_1.sql

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
CREATE TABLE town ();

data/tokenizer_input_2.sql

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
SELECT name FROM city;

data/tokenizer_input_3.sql

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,2 @@
1+
INSERT INTO city (name, population, timezone)
2+
VALUES ('San Francisco', 852469, -8);

data/tokenizer_input_4.sql

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,2 @@
1+
INSERT INTO items (type)
2+
VALUES ('"d"r"u"g"s"');

data/tokenizer_input_5.sql

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
SELECT (
2+
name,
3+
population,
4+
timezone
5+
)
6+
FROM city;

data/tokenizer_input_6.sql

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,5 @@
1+
CREATE TABLE city (
2+
name VARCHAR,
3+
population INT,
4+
timezone INT
5+
);

0 commit comments

Comments
 (0)