mychen76 commited on
Commit
96cb768
1 Parent(s): 06972a3

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +143 -1
README.md CHANGED
@@ -13,7 +13,83 @@ base_model: unsloth/mistral-7b-instruct-v0.2-bnb-4bit
13
  ## Format
14
  - chatml
15
 
16
- prompt=f"""<|im_start|>system
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
17
  You are POS receipt data expert, parse, detect, recognize and convert following receipt OCR image result into structure receipt data object.
18
  Don't make up value not in the Input. Output must be a well-formed JSON object.```json<|im_end|>
19
  <|im_start|>user
@@ -21,6 +97,72 @@ Don't make up value not in the Input. Output must be a well-formed JSON object.`
21
  <|im_start|>assistant
22
  """
23
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
24
  # Uploaded model
25
 
26
  - **Developed by:** mychen76
 
13
  ## Format
14
  - chatml
15
 
16
+ receipt_boxes from Paddle-OCR
17
+ ```
18
+ ocr boxes:
19
+
20
+ [
21
+ [[[188.0, 54.0], [453.0, 54.0], [453.0, 85.0], [188.0, 85.0]], ('The Lone Pine', 0.9998102188110352)],
22
+ [[[194.0, 96.0], [449.0, 98.0], [449.0, 122.0], [194.0, 120.0]], ('43 Manchester Road', 0.9988968372344971)],
23
+ [[[228.0, 127.0], [416.0, 130.0], [416.0, 154.0], [228.0, 151.0]], ('12480 Brisbane', 0.9658010601997375)],
24
+ [[[267.0, 162.0], [375.0, 162.0], [375.0, 186.0], [267.0, 186.0]], ('Australia', 0.9997145533561707)],
25
+ [[[234.0, 193.0], [409.0, 193.0], [409.0, 216.0], [234.0, 216.0]], ('617-3236-6207', 0.9996874332427979)],
26
+ [[[46.0, 255.0], [308.0, 255.0], [308.0, 278.0], [46.0, 278.0]], ('Invoice 08000008', 0.9919923543930054)],
27
+ [[[466.0, 255.0], [598.0, 255.0], [598.0, 278.0], [466.0, 278.0]], ('09/04/08', 0.9994747042655945)],
28
+ [[[42.0, 283.0], [132.0, 283.0], [132.0, 311.0], [42.0, 311.0]], ('Table', 0.9969210624694824)],
29
+ [[[174.0, 283.0], [214.0, 283.0], [214.0, 311.0], [174.0, 311.0]], ('25', 0.9997891783714294)],
30
+ [[[514.0, 284.0], [601.0, 284.0], [601.0, 311.0], [514.0, 311.0]], ('12:45', 0.9964954257011414)],
31
+ [[[67.0, 346.0], [291.0, 349.0], [291.0, 376.0], [67.0, 374.0]], ('2 Carlsberg Bottle', 0.9987921118736267)],
32
+ [[[515.0, 346.0], [599.0, 346.0], [599.0, 372.0], [515.0, 372.0]], ('16.00', 0.9999278783798218)],
33
+ [
34
+ [[69.0, 385.0], [395.0, 387.0], [395.0, 411.0], [69.0, 409.0]],
35
+ ('3 Heineken Draft Standard.', 0.9832896590232849)
36
+ ],
37
+ [[[515.0, 384.0], [599.0, 384.0], [599.0, 409.0], [515.0, 409.0]], ('24.60', 0.9998160600662231)],
38
+ [
39
+ [[71.0, 423.0], [391.0, 423.0], [391.0, 446.0], [71.0, 446.0]],
40
+ ('1 Heineken Draft Half Liter.', 0.9641079306602478)
41
+ ],
42
+ [[[515.0, 421.0], [601.0, 421.0], [601.0, 450.0], [515.0, 450.0]], ('15.20', 0.9998868703842163)],
43
+ [
44
+ [[69.0, 460.0], [430.0, 461.0], [430.0, 485.0], [69.0, 484.0]],
45
+ ('2 Carlsberg Bucket (5 bottles).', 0.974445641040802)
46
+ ],
47
+ [[[515.0, 461.0], [599.0, 461.0], [599.0, 486.0], [515.0, 486.0]], ('80.00', 0.9999423027038574)],
48
+ [
49
+ [[69.0, 498.0], [367.0, 500.0], [367.0, 524.0], [69.0, 522.0]],
50
+ ('4 Grilled Chicken Breast.', 0.9773013591766357)
51
+ ],
52
+ [[[515.0, 499.0], [599.0, 499.0], [599.0, 524.0], [515.0, 524.0]], ('74.00', 0.9999669194221497)],
53
+ [[[68.0, 534.0], [250.0, 537.0], [250.0, 562.0], [68.0, 560.0]], ('3 Sirloin Steak', 0.9997309446334839)],
54
+ [[[515.0, 537.0], [599.0, 537.0], [599.0, 561.0], [515.0, 561.0]], ('96.00', 0.9999544024467468)],
55
+ [[[67.0, 571.0], [162.0, 574.0], [161.0, 601.0], [67.0, 598.0]], ('1 Coke', 0.9997830390930176)],
56
+ [[[530.0, 572.0], [602.0, 572.0], [602.0, 601.0], [530.0, 601.0]], ('3.50', 0.9999455213546753)],
57
+ [[[69.0, 609.0], [219.0, 613.0], [218.0, 638.0], [68.0, 634.0]], ('5 Ice Cream', 0.9914276003837585)],
58
+ [[[516.0, 611.0], [599.0, 611.0], [599.0, 637.0], [516.0, 637.0]], ('18.00', 0.9999335408210754)],
59
+ [[[154.0, 664.0], [288.0, 664.0], [288.0, 688.0], [154.0, 688.0]], ('Subtotal', 0.9990750551223755)],
60
+ [[[499.0, 664.0], [599.0, 664.0], [599.0, 688.0], [499.0, 688.0]], ('327.30', 0.9999768137931824)],
61
+ [
62
+ [[155.0, 701.0], [397.0, 701.0], [397.0, 724.0], [155.0, 724.0]],
63
+ ('Sales/Gov Tax - 5%', 0.9552016854286194)
64
+ ],
65
+ [[[514.0, 697.0], [601.0, 697.0], [601.0, 724.0], [514.0, 724.0]], ('16.36', 0.999823272228241)],
66
+ [
67
+ [[155.0, 733.0], [419.0, 733.0], [419.0, 757.0], [155.0, 757.0]],
68
+ ('Service Charge - 10%', 0.9921379089355469)
69
+ ],
70
+ [[[512.0, 728.0], [601.0, 731.0], [600.0, 759.0], [511.0, 757.0]], ('32.73', 0.9999620318412781)],
71
+ [[[154.0, 775.0], [335.0, 775.0], [335.0, 799.0], [154.0, 799.0]], ('GRAND TOTAL', 0.9899482131004333)],
72
+ [[[499.0, 778.0], [599.0, 778.0], [599.0, 802.0], [499.0, 802.0]], ('376.40', 0.9999797940254211)],
73
+ [[[39.0, 831.0], [223.0, 831.0], [223.0, 859.0], [39.0, 859.0]], ('Thank you and', 0.9922393560409546)],
74
+ [[[336.0, 831.0], [407.0, 831.0], [407.0, 860.0], [336.0, 860.0]], ('Cash', 0.9998616576194763)],
75
+ [[[499.0, 831.0], [601.0, 831.0], [601.0, 859.0], [499.0, 859.0]], ('400.00', 0.9998554587364197)],
76
+ [[[38.0, 866.0], [220.0, 862.0], [220.0, 891.0], [38.0, 895.0]], ('see you again!', 0.9798372983932495)],
77
+ [[[336.0, 864.0], [438.0, 869.0], [437.0, 898.0], [335.0, 894.0]], ('Change', 0.9998979568481445)],
78
+ [[[515.0, 867.0], [599.0, 867.0], [599.0, 892.0], [515.0, 892.0]], ('23.60', 0.9999337196350098)],
79
+ [[[37.0, 901.0], [108.0, 901.0], [108.0, 930.0], [37.0, 930.0]], ('John', 0.9990785717964172)],
80
+ [
81
+ [[73.0, 962.0], [569.0, 965.0], [569.0, 991.0], [73.0, 989.0]],
82
+ ('Bring this bill back within the next 10 days', 0.9880552887916565)
83
+ ],
84
+ [
85
+ [[50.0, 1000.0], [591.0, 1000.0], [591.0, 1023.0], [50.0, 1023.0]],
86
+ ("and get 15% discount on that day's food bill..", 0.9851154685020447)
87
+ ]
88
+ ]
89
+ ```
90
+
91
+ # prompt
92
+ f"""<|im_start|>system
93
  You are POS receipt data expert, parse, detect, recognize and convert following receipt OCR image result into structure receipt data object.
94
  Don't make up value not in the Input. Output must be a well-formed JSON object.```json<|im_end|>
95
  <|im_start|>user
 
97
  <|im_start|>assistant
98
  """
99
 
100
+ # Result
101
+ ```
102
+ <|im_start|>assistant
103
+ {
104
+ "store_name": "The Lone Pine",
105
+ "store_address": "43 Manchester Road",
106
+ "city": "Brisbane",
107
+ "country": "Australia",
108
+ "phone": "617-3236-6207",
109
+ "invoice_number": "08000008",
110
+ "invoice_date": "09/04/08",
111
+ "table_number": "25",
112
+ "time": "12:45",
113
+ "items": [
114
+ {
115
+ "item_name": "Carlsberg Bottle",
116
+ "quantity": "2",
117
+ "price": "16.00"
118
+ },
119
+ {
120
+ "item_name": "Heineken Draft Half Liter.",
121
+ "quantity": "1",
122
+ "price": "15.20"
123
+ },
124
+ {
125
+ "item_name": "Heineken Draft Standard.",
126
+ "quantity": "3",
127
+ "price": "12.00"
128
+ },
129
+ {
130
+ "item_name": "Sirloin Steak",
131
+ "quantity": "3",
132
+ "price": "96.00"
133
+ },
134
+ {
135
+ "item_name": "Grilled Chicken Breast",
136
+ "quantity": "4",
137
+ "price": "74.00"
138
+ },
139
+ {
140
+ "item_name": "Coke",
141
+ "quantity": "1",
142
+ "price": "3.50"
143
+ },
144
+ {
145
+ "item_name": "Ice Cream",
146
+ "quantity": "5",
147
+ "price": "18.00"
148
+ }
149
+ ],
150
+ "subtotal": "327.30",
151
+ "tax": "16.36",
152
+ "service_charge": "32.73",
153
+ "total": "376.40",
154
+ "payment": {
155
+ "cash": "400.00",
156
+ "change": "23.60"
157
+ },
158
+ "customer": {
159
+ "name": "John"
160
+ },
161
+ "discount": "15%"
162
+ }<|im_end|></s>
163
+ ```
164
+
165
+
166
  # Uploaded model
167
 
168
  - **Developed by:** mychen76