Update README.md
Browse files
README.md
CHANGED
|
@@ -13,7 +13,83 @@ base_model: unsloth/mistral-7b-instruct-v0.2-bnb-4bit
|
|
| 13 |
## Format
|
| 14 |
- chatml
|
| 15 |
|
| 16 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 17 |
You are POS receipt data expert, parse, detect, recognize and convert following receipt OCR image result into structure receipt data object.
|
| 18 |
Don't make up value not in the Input. Output must be a well-formed JSON object.```json<|im_end|>
|
| 19 |
<|im_start|>user
|
|
@@ -21,6 +97,72 @@ Don't make up value not in the Input. Output must be a well-formed JSON object.`
|
|
| 21 |
<|im_start|>assistant
|
| 22 |
"""
|
| 23 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 24 |
# Uploaded model
|
| 25 |
|
| 26 |
- **Developed by:** mychen76
|
|
|
|
| 13 |
## Format
|
| 14 |
- chatml
|
| 15 |
|
| 16 |
+
receipt_boxes from Paddle-OCR
|
| 17 |
+
```
|
| 18 |
+
ocr boxes:
|
| 19 |
+
|
| 20 |
+
[
|
| 21 |
+
[[[188.0, 54.0], [453.0, 54.0], [453.0, 85.0], [188.0, 85.0]], ('The Lone Pine', 0.9998102188110352)],
|
| 22 |
+
[[[194.0, 96.0], [449.0, 98.0], [449.0, 122.0], [194.0, 120.0]], ('43 Manchester Road', 0.9988968372344971)],
|
| 23 |
+
[[[228.0, 127.0], [416.0, 130.0], [416.0, 154.0], [228.0, 151.0]], ('12480 Brisbane', 0.9658010601997375)],
|
| 24 |
+
[[[267.0, 162.0], [375.0, 162.0], [375.0, 186.0], [267.0, 186.0]], ('Australia', 0.9997145533561707)],
|
| 25 |
+
[[[234.0, 193.0], [409.0, 193.0], [409.0, 216.0], [234.0, 216.0]], ('617-3236-6207', 0.9996874332427979)],
|
| 26 |
+
[[[46.0, 255.0], [308.0, 255.0], [308.0, 278.0], [46.0, 278.0]], ('Invoice 08000008', 0.9919923543930054)],
|
| 27 |
+
[[[466.0, 255.0], [598.0, 255.0], [598.0, 278.0], [466.0, 278.0]], ('09/04/08', 0.9994747042655945)],
|
| 28 |
+
[[[42.0, 283.0], [132.0, 283.0], [132.0, 311.0], [42.0, 311.0]], ('Table', 0.9969210624694824)],
|
| 29 |
+
[[[174.0, 283.0], [214.0, 283.0], [214.0, 311.0], [174.0, 311.0]], ('25', 0.9997891783714294)],
|
| 30 |
+
[[[514.0, 284.0], [601.0, 284.0], [601.0, 311.0], [514.0, 311.0]], ('12:45', 0.9964954257011414)],
|
| 31 |
+
[[[67.0, 346.0], [291.0, 349.0], [291.0, 376.0], [67.0, 374.0]], ('2 Carlsberg Bottle', 0.9987921118736267)],
|
| 32 |
+
[[[515.0, 346.0], [599.0, 346.0], [599.0, 372.0], [515.0, 372.0]], ('16.00', 0.9999278783798218)],
|
| 33 |
+
[
|
| 34 |
+
[[69.0, 385.0], [395.0, 387.0], [395.0, 411.0], [69.0, 409.0]],
|
| 35 |
+
('3 Heineken Draft Standard.', 0.9832896590232849)
|
| 36 |
+
],
|
| 37 |
+
[[[515.0, 384.0], [599.0, 384.0], [599.0, 409.0], [515.0, 409.0]], ('24.60', 0.9998160600662231)],
|
| 38 |
+
[
|
| 39 |
+
[[71.0, 423.0], [391.0, 423.0], [391.0, 446.0], [71.0, 446.0]],
|
| 40 |
+
('1 Heineken Draft Half Liter.', 0.9641079306602478)
|
| 41 |
+
],
|
| 42 |
+
[[[515.0, 421.0], [601.0, 421.0], [601.0, 450.0], [515.0, 450.0]], ('15.20', 0.9998868703842163)],
|
| 43 |
+
[
|
| 44 |
+
[[69.0, 460.0], [430.0, 461.0], [430.0, 485.0], [69.0, 484.0]],
|
| 45 |
+
('2 Carlsberg Bucket (5 bottles).', 0.974445641040802)
|
| 46 |
+
],
|
| 47 |
+
[[[515.0, 461.0], [599.0, 461.0], [599.0, 486.0], [515.0, 486.0]], ('80.00', 0.9999423027038574)],
|
| 48 |
+
[
|
| 49 |
+
[[69.0, 498.0], [367.0, 500.0], [367.0, 524.0], [69.0, 522.0]],
|
| 50 |
+
('4 Grilled Chicken Breast.', 0.9773013591766357)
|
| 51 |
+
],
|
| 52 |
+
[[[515.0, 499.0], [599.0, 499.0], [599.0, 524.0], [515.0, 524.0]], ('74.00', 0.9999669194221497)],
|
| 53 |
+
[[[68.0, 534.0], [250.0, 537.0], [250.0, 562.0], [68.0, 560.0]], ('3 Sirloin Steak', 0.9997309446334839)],
|
| 54 |
+
[[[515.0, 537.0], [599.0, 537.0], [599.0, 561.0], [515.0, 561.0]], ('96.00', 0.9999544024467468)],
|
| 55 |
+
[[[67.0, 571.0], [162.0, 574.0], [161.0, 601.0], [67.0, 598.0]], ('1 Coke', 0.9997830390930176)],
|
| 56 |
+
[[[530.0, 572.0], [602.0, 572.0], [602.0, 601.0], [530.0, 601.0]], ('3.50', 0.9999455213546753)],
|
| 57 |
+
[[[69.0, 609.0], [219.0, 613.0], [218.0, 638.0], [68.0, 634.0]], ('5 Ice Cream', 0.9914276003837585)],
|
| 58 |
+
[[[516.0, 611.0], [599.0, 611.0], [599.0, 637.0], [516.0, 637.0]], ('18.00', 0.9999335408210754)],
|
| 59 |
+
[[[154.0, 664.0], [288.0, 664.0], [288.0, 688.0], [154.0, 688.0]], ('Subtotal', 0.9990750551223755)],
|
| 60 |
+
[[[499.0, 664.0], [599.0, 664.0], [599.0, 688.0], [499.0, 688.0]], ('327.30', 0.9999768137931824)],
|
| 61 |
+
[
|
| 62 |
+
[[155.0, 701.0], [397.0, 701.0], [397.0, 724.0], [155.0, 724.0]],
|
| 63 |
+
('Sales/Gov Tax - 5%', 0.9552016854286194)
|
| 64 |
+
],
|
| 65 |
+
[[[514.0, 697.0], [601.0, 697.0], [601.0, 724.0], [514.0, 724.0]], ('16.36', 0.999823272228241)],
|
| 66 |
+
[
|
| 67 |
+
[[155.0, 733.0], [419.0, 733.0], [419.0, 757.0], [155.0, 757.0]],
|
| 68 |
+
('Service Charge - 10%', 0.9921379089355469)
|
| 69 |
+
],
|
| 70 |
+
[[[512.0, 728.0], [601.0, 731.0], [600.0, 759.0], [511.0, 757.0]], ('32.73', 0.9999620318412781)],
|
| 71 |
+
[[[154.0, 775.0], [335.0, 775.0], [335.0, 799.0], [154.0, 799.0]], ('GRAND TOTAL', 0.9899482131004333)],
|
| 72 |
+
[[[499.0, 778.0], [599.0, 778.0], [599.0, 802.0], [499.0, 802.0]], ('376.40', 0.9999797940254211)],
|
| 73 |
+
[[[39.0, 831.0], [223.0, 831.0], [223.0, 859.0], [39.0, 859.0]], ('Thank you and', 0.9922393560409546)],
|
| 74 |
+
[[[336.0, 831.0], [407.0, 831.0], [407.0, 860.0], [336.0, 860.0]], ('Cash', 0.9998616576194763)],
|
| 75 |
+
[[[499.0, 831.0], [601.0, 831.0], [601.0, 859.0], [499.0, 859.0]], ('400.00', 0.9998554587364197)],
|
| 76 |
+
[[[38.0, 866.0], [220.0, 862.0], [220.0, 891.0], [38.0, 895.0]], ('see you again!', 0.9798372983932495)],
|
| 77 |
+
[[[336.0, 864.0], [438.0, 869.0], [437.0, 898.0], [335.0, 894.0]], ('Change', 0.9998979568481445)],
|
| 78 |
+
[[[515.0, 867.0], [599.0, 867.0], [599.0, 892.0], [515.0, 892.0]], ('23.60', 0.9999337196350098)],
|
| 79 |
+
[[[37.0, 901.0], [108.0, 901.0], [108.0, 930.0], [37.0, 930.0]], ('John', 0.9990785717964172)],
|
| 80 |
+
[
|
| 81 |
+
[[73.0, 962.0], [569.0, 965.0], [569.0, 991.0], [73.0, 989.0]],
|
| 82 |
+
('Bring this bill back within the next 10 days', 0.9880552887916565)
|
| 83 |
+
],
|
| 84 |
+
[
|
| 85 |
+
[[50.0, 1000.0], [591.0, 1000.0], [591.0, 1023.0], [50.0, 1023.0]],
|
| 86 |
+
("and get 15% discount on that day's food bill..", 0.9851154685020447)
|
| 87 |
+
]
|
| 88 |
+
]
|
| 89 |
+
```
|
| 90 |
+
|
| 91 |
+
# prompt
|
| 92 |
+
f"""<|im_start|>system
|
| 93 |
You are POS receipt data expert, parse, detect, recognize and convert following receipt OCR image result into structure receipt data object.
|
| 94 |
Don't make up value not in the Input. Output must be a well-formed JSON object.```json<|im_end|>
|
| 95 |
<|im_start|>user
|
|
|
|
| 97 |
<|im_start|>assistant
|
| 98 |
"""
|
| 99 |
|
| 100 |
+
# Result
|
| 101 |
+
```
|
| 102 |
+
<|im_start|>assistant
|
| 103 |
+
{
|
| 104 |
+
"store_name": "The Lone Pine",
|
| 105 |
+
"store_address": "43 Manchester Road",
|
| 106 |
+
"city": "Brisbane",
|
| 107 |
+
"country": "Australia",
|
| 108 |
+
"phone": "617-3236-6207",
|
| 109 |
+
"invoice_number": "08000008",
|
| 110 |
+
"invoice_date": "09/04/08",
|
| 111 |
+
"table_number": "25",
|
| 112 |
+
"time": "12:45",
|
| 113 |
+
"items": [
|
| 114 |
+
{
|
| 115 |
+
"item_name": "Carlsberg Bottle",
|
| 116 |
+
"quantity": "2",
|
| 117 |
+
"price": "16.00"
|
| 118 |
+
},
|
| 119 |
+
{
|
| 120 |
+
"item_name": "Heineken Draft Half Liter.",
|
| 121 |
+
"quantity": "1",
|
| 122 |
+
"price": "15.20"
|
| 123 |
+
},
|
| 124 |
+
{
|
| 125 |
+
"item_name": "Heineken Draft Standard.",
|
| 126 |
+
"quantity": "3",
|
| 127 |
+
"price": "12.00"
|
| 128 |
+
},
|
| 129 |
+
{
|
| 130 |
+
"item_name": "Sirloin Steak",
|
| 131 |
+
"quantity": "3",
|
| 132 |
+
"price": "96.00"
|
| 133 |
+
},
|
| 134 |
+
{
|
| 135 |
+
"item_name": "Grilled Chicken Breast",
|
| 136 |
+
"quantity": "4",
|
| 137 |
+
"price": "74.00"
|
| 138 |
+
},
|
| 139 |
+
{
|
| 140 |
+
"item_name": "Coke",
|
| 141 |
+
"quantity": "1",
|
| 142 |
+
"price": "3.50"
|
| 143 |
+
},
|
| 144 |
+
{
|
| 145 |
+
"item_name": "Ice Cream",
|
| 146 |
+
"quantity": "5",
|
| 147 |
+
"price": "18.00"
|
| 148 |
+
}
|
| 149 |
+
],
|
| 150 |
+
"subtotal": "327.30",
|
| 151 |
+
"tax": "16.36",
|
| 152 |
+
"service_charge": "32.73",
|
| 153 |
+
"total": "376.40",
|
| 154 |
+
"payment": {
|
| 155 |
+
"cash": "400.00",
|
| 156 |
+
"change": "23.60"
|
| 157 |
+
},
|
| 158 |
+
"customer": {
|
| 159 |
+
"name": "John"
|
| 160 |
+
},
|
| 161 |
+
"discount": "15%"
|
| 162 |
+
}<|im_end|></s>
|
| 163 |
+
```
|
| 164 |
+
|
| 165 |
+
|
| 166 |
# Uploaded model
|
| 167 |
|
| 168 |
- **Developed by:** mychen76
|