JacksonLark committed on
Commit
dd58119
1 Parent(s): ea72c6c

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +15 -0
README.md CHANGED
@@ -30,4 +30,19 @@ inputs = tokenizer.encode(text, return_tensors="pt").to(device)
30
  output_ids = model.generate(inputs, max_length=512)
31
  response_text = tokenizer.decode(output_ids[0], skip_special_tokens=True)
32
  # SELECT COUNT( * ) FROM track
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  ```
 
30
  output_ids = model.generate(inputs, max_length=512)
31
  response_text = tokenizer.decode(output_ids[0], skip_special_tokens=True)
32
  # SELECT COUNT( * ) FROM track
33
+ ```
34
+
35
+ # How to Train
36
+
37
+ Datasets:
38
+ - https://huggingface.co/datasets/laion/OIG#unified_sqlv1jsonl-17000
39
+ - https://huggingface.co/datasets/laion/OIG#unified_sqlv2jsonl24000
40
+
41
+ ```json
42
+ {
43
+ "text":"<human>: Given the following schema:\nlocation (restaurant_id, house_number, street_name, city_name)\nrestaurant (id, name, food_type, city_name, rating)\ngeographic (city_name, county, region)\nWrite a SQL query to give me some good arabic -s on buchanan in san francisco ?\n<bot>: SELECT location.house_number , restaurant.name FROM location , restaurant WHERE location.city_name = \"san francisco\" AND location.street_name = \"buchanan\" AND restaurant.food_type = \"arabic\" AND restaurant.id = location.restaurant_id AND restaurant.rating > 2.5 ;",
44
+ "metadata":{
45
+ "source":"unified_sqlv1"
46
+ }
47
+ }
48
  ```