JacksonLark
committed on
Commit
•
dd58119
1
Parent(s):
ea72c6c
Update README.md
Browse files
README.md
CHANGED
@@ -30,4 +30,19 @@ inputs = tokenizer.encode(text, return_tensors="pt").to(device)
|
|
30 |
output_ids = model.generate(inputs, max_length=512)
|
31 |
response_text = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
|
32 |
# SELECT COUNT( * ) FROM track
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
```
|
|
|
30 |
output_ids = model.generate(inputs, max_length=512)
|
31 |
response_text = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
|
32 |
# SELECT COUNT( * ) FROM track
|
33 |
+
```
|
34 |
+
|
35 |
+
# How to Train
|
36 |
+
|
37 |
+
Dataset:
|
38 |
+
- https://huggingface.co/datasets/laion/OIG#unified_sqlv1jsonl-17000
|
39 |
+
- https://huggingface.co/datasets/laion/OIG#unified_sqlv2jsonl24000
|
40 |
+
|
41 |
+
```json
|
42 |
+
{
|
43 |
+
"text":"<human>: Given the following schema:\nlocation (restaurant_id, house_number, street_name, city_name)\nrestaurant (id, name, food_type, city_name, rating)\ngeographic (city_name, county, region)\nWrite a SQL query to give me some good arabic -s on buchanan in san francisco ?\n<bot>: SELECT location.house_number , restaurant.name FROM location , restaurant WHERE location.city_name = \"san francisco\" AND location.street_name = \"buchanan\" AND restaurant.food_type = \"arabic\" AND restaurant.id = location.restaurant_id AND restaurant.rating > 2.5 ;",
|
44 |
+
"metadata":{
|
45 |
+
"source":"unified_sqlv1"
|
46 |
+
}
|
47 |
+
}
|
48 |
```
|