Skip to content

Commit f92933b

Browse files
Eval driven system design cookbook (#1875)
1 parent e5aac77 commit f92933b

File tree

262 files changed

+2592
-0
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

262 files changed

+2592
-0
lines changed
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": false,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "1. The receipt is for gas (E-85 fuel), which is a travel-related expense. Therefore, NOT_TRAVEL_RELATED is FALSE. \n2. The total amount of the receipt is $36.16, which does not exceed $50. Therefore, AMOUNT_OVER_LIMIT is FALSE. \n3. The subtotal of $36.16 matches the total of $36.16, indicating no math errors. Therefore, MATH_ERROR is FALSE. \n4. The handwritten notes do not contain an 'X'. Therefore, HANDWRITTEN_X is FALSE.",
7+
"needs_audit": false
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": false,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "The receipt is for gasoline, which is considered a travel-related expense, so it does not meet the NOT_TRAVEL_RELATED criterion. The total amount is $49.61, which is below the $50 limit, so the AMOUNT_OVER_LIMIT criterion is not violated. There are no discrepancies in the math for computing the total, confirming that MATH_ERROR is false. There is no 'X' present in the handwritten notes, meaning HANDWRITTEN_X is also false. Since none of the criteria are violated, the receipt does not need auditing.",
7+
"needs_audit": false
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": true,
4+
"math_error": false,
5+
"handwritten_x": true,
6+
"reasoning": "The receipt is for fuel, which is classified as a travel-related expense, hence it does not satisfy the NOT_TRAVEL_RELATED criterion. The total amount of $60.91 exceeds the $50 limit, thus satisfying the AMOUNT_OVER_LIMIT criterion. There are no discrepancies in the arithmetic calculations for the total, so MATH_ERROR is false. However, there is a handwritten 'X' noted in the handwritten notes, which satisfies the HANDWRITTEN_X criterion. 1. NOT_TRAVEL_RELATED: This is a fuel purchase (travel-related), so not_travel_related=false. 2. AMOUNT_OVER_LIMIT: Total of $60.91 exceeds $50, so amount_over_limit=true. 3. MATH_ERROR: 4.199×14.5076≈60.9174, which rounds up to $60.92 or truncates to $60.91, the listed total (either would be acceptable), so math_error=false. 4. HANDWRITTEN_X: The note 'X' is written on the the receipt, so handwritten_x=true. At least one criterion is violated, so needs_audit=true.",
7+
"needs_audit": true
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": true,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "The receipt is for fuel, which is considered travel-related, hence NOT_TRAVEL_RELATED is FALSE. The total amount of the receipt is $72.10, which exceeds the $50 limit making AMOUNT_OVER_LIMIT TRUE. The math adds up correctly as the subtotal matches the total, so MATH_ERROR is FALSE. There are no handwritten 'X's in the notes so HANDWRITTEN_X is FALSE. Since one of the criteria (AMOUNT_OVER_LIMIT) is violated, the receipt needs auditing.",
7+
"needs_audit": true
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": true,
3+
"amount_over_limit": true,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "1. NOT_TRAVEL_RELATED: The receipt is for home goods and cleaning supplies, which are not travel-related expenses. Therefore, this criterion is TRUE.\n\n2. AMOUNT_OVER_LIMIT: The total of the receipt is $273.52, which is over the $50 limit, making this criterion TRUE.\n\n3. MATH_ERROR: The subtotal adds up correctly when calculated with tax. The subtotal $252.67 plus tax $20.85 equals the total $273.52. Thus, there is no math error, and this is FALSE.\n\n4. HANDWRITTEN_X: There is no 'X' in the handwritten notes provided. Thus, this is FALSE.\n\nSince two of the criteria (AMOUNT_OVER_LIMIT and MATH_ERROR) are TRUE, the final determination is that this receipt needs to be audited.",
7+
"needs_audit": true
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": false,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "1. NOT_TRAVEL_RELATED: The receipt includes fuel as a purchase which is considered travel-related, therefore this criterion is FALSE.\n2. AMOUNT_OVER_LIMIT: The total amount is $49.54, which does not exceed $50, so this is FALSE.\n3. MATH_ERROR: The line item for fuel ($49.54) matches the total provided ($49.54), hence there is no math error, making this FALSE.\n4. HANDWRITTEN_X: There is no 'X' in the handwritten notes, so this is FALSE. \nSince none of the criteria are violated, the receipt does not need an audit.",
7+
"needs_audit": false
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": true,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "The expenses are for fuel, which is a travel-related cost, so the criterion for being 'not travel-related' is FALSE. The total amount of the receipt is $60.94, which exceeds the $50 limit, making the 'Amount Over Limit' criterion TRUE. There are no discrepancies in the math as the total matches the sum of the item prices, and there is no 'X' in the handwritten notes. Since one of the criteria (Amount Over Limit) is violated, the receipt needs to be audited.",
7+
"needs_audit": true
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": false,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "1. NOT_TRAVEL_RELATED: The receipt is for fuel, which is considered a travel-related expense, so this is FALSE. 2. AMOUNT_OVER_LIMIT: The total amount is $41.46, which does not exceed $50, so this is FALSE. 3. MATH_ERROR: The total of the line item ($41.46) matches the total provided, so this is FALSE. 4. HANDWRITTEN_X: There is no 'X' in the handwritten notes, so this is FALSE. Since none of the criteria are violated, the receipt does not need auditing.",
7+
"needs_audit": false
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": false,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "1. NOT_TRAVEL_RELATED: The receipt is from Shell Gasoline and includes fuel expenses, making it travel-related. Therefore, this criterion is FALSE. 2. AMOUNT_OVER_LIMIT: The total amount of $38.26 is below the $50 threshold, so this criterion is FALSE. 3. MATH_ERROR: The line item for fuel ($38.26) matches the computed total, indicating no math errors, so this criterion is FALSE. 4. HANDWRITTEN_X: There is no 'X' present in the handwritten notes on the receipt, making this criterion FALSE. Since all criteria are not violated (all FALSE), the receipt does not need auditing.",
7+
"needs_audit": false
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": true,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "The receipt is for 'Unleaded' fuel from a gas station, which is a travel-related expense, thus the NOT_TRAVEL_RELATED criterion is FALSE. The total amount of the receipt is $62.68, exceeding the $50 limit, making AMOUNT_OVER_LIMIT TRUE. There are no discrepancies in the math calculations presented, hence MATH_ERROR is FALSE. There is no 'X' noted in the handwritten notes, so HANDWRITTEN_X is FALSE. Since the AMOUNT_OVER_LIMIT criteria is violated, the receipt needs auditing.",
7+
"needs_audit": true
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": false,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "1. NOT_TRAVEL_RELATED: The receipt is from 'Shell Gasoline' for fuel (E85), which is a travel-related expense. Therefore, this criterion is not violated (FALSE). \n2. AMOUNT_OVER_LIMIT: The total amount on the receipt is $40.19, which does not exceed the $50 limit. This criterion is not violated (FALSE). \n3. MATH_ERROR: The total of the item listed ($40.19) matches the provided total; hence, there are no math errors. This criterion is not violated (FALSE). \n4. HANDWRITTEN_X: There is no 'X' noted in the handwritten notes. This criterion is not violated (FALSE). \n\nSince no criteria were violated, the receipt does not need auditing.",
7+
"needs_audit": false
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": false,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "1. Not Travel Related: The receipt is for fuel, which is a travel-related expense, thus this criterion is FALSE.\n2. Amount Over Limit: The total amount of $47.06 does not exceed $50, so this criterion is FALSE.\n3. Math Error: The total amount ($47.06) matches the calculated total from the line item (3.859 * 12.195 = 47.06), so there is no math error, making this criterion FALSE.\n4. Handwritten X: There are no 'X's noted in the handwritten notes, hence this criterion is FALSE.\nSince none of the criteria are violated, the receipt does not need auditing.",
7+
"needs_audit": false
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": true,
3+
"amount_over_limit": false,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "1. NOT_TRAVEL_RELATED: The receipt is for stationery items, so it is not a travel-related expense (TRUE). \n\n2. AMOUNT_OVER_LIMIT: The total amount is $8.68, which does not exceed $50 (FALSE). \n\n3. MATH_ERROR: The subtotal of $7.98 plus tax of $0.70 correctly sums up to a total of $8.68 (FALSE). \n\n4. HANDWRITTEN_X: There is no 'X' present in the handwritten notes (FALSE). \n\nSince NOT_TRAVEL_RELATED is true the receipt requires auditing.",
7+
"needs_audit": true
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": true,
3+
"amount_over_limit": false,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "The receipt is for household and grocery items (Airwick, pantry goods) and contains no travel-related expense (e.g., gas, hotel, airfare). The total $40.69 does not exceed $50. The line items sum correctly to the subtotal and total (15.48 + 17.48 + 4.98 + 2.75 tax = 40.69). There are no handwritten notes or an “X.” Because the expense is not travel-related, the receipt requires auditing.",
7+
"needs_audit": true
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": false,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "1. NOT_TRAVEL_RELATED: The receipt is for Fuel, which is a travel-related expense, so this criterion is FALSE. 2. AMOUNT_OVER_LIMIT: The total amount is $31.58, which does not exceed $50, so this criterion is FALSE. 3. MATH_ERROR: The total matches the sum of the line items ($31.58), so there is no math error, this criterion is FALSE. 4. HANDWRITTEN_X: There is no 'X' in the handwritten notes, so this criterion is FALSE.",
7+
"needs_audit": false
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": true,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "1. NOT_TRAVEL_RELATED: The receipt is for fuel, which is considered a travel-related expense, thus this criterion is FALSE. 2. AMOUNT_OVER_LIMIT: The total amount of $63.13 exceeds the limit of $50, so this criterion is TRUE. 3. MATH_ERROR: The subtotal and total match, indicating there are no math errors, thus this criterion is FALSE. 4. HANDWRITTEN_X: There is no 'X' in the handwritten notes, making this criterion FALSE.",
7+
"needs_audit": true
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": false,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "1. NOT_TRAVEL_RELATED: The receipt is for fuel (Regular Unleaded), which is a travel-related expense, so this is FALSE.\n2. AMOUNT_OVER_LIMIT: The total amount is $45.25, which does not exceed $50, so this is FALSE.\n3. MATH_ERROR: The subtotal, tax, and total correctly add up to $45.25 with no discrepancies, so this is FALSE.\n4. HANDWRITTEN_X: There are no handwritten 'X's present in the notes, so this is FALSE.",
7+
"needs_audit": false
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": false,
4+
"math_error": false,
5+
"handwritten_x": true,
6+
"reasoning": "The receipt is for fuel, which is a travel-related expense, hence NOT_TRAVEL_RELATED is false. The total amount of $32.00 is below the $50 limit, so AMOUNT_OVER_LIMIT is false. There are no math errors as the calculated total matches the receipt total, so MATH_ERROR is false. However, there is an 'X' present in the handwritten notes, making HANDWRITTEN_X true. Since HANDWRITTEN_X is violated, the receipt needs auditing.",
7+
"needs_audit": true
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": false,
3+
"amount_over_limit": false,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "The receipt from O'Reilly Auto Parts is for an automotive item (SNOWBROOM). A snow broom could be required to for safe driving in snowy conditions, so this is plausibly a valid travel-related expense, so NOT_TRAVEL_RELATED is false. The total amount of the receipt is $35.55, which does not exceed the $50 limit, thus AMOUNT_OVER_LIMIT is false. There are no discrepancies in the math as the subtotal plus tax equals the total, so MATH_ERROR is false. The handwritten notes section is empty, therefore HANDWRITTEN_X is false.",
7+
"needs_audit": false
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
{
2+
"not_travel_related": true,
3+
"amount_over_limit": false,
4+
"math_error": false,
5+
"handwritten_x": false,
6+
"reasoning": "The receipt is for tools purchased at The Home Depot, which are NOT travel-related expenses, so NOT_TRAVEL_RELATED is true. The total amount of $43.54 does not exceed $50, so AMOUNT_OVER_LIMIT is false. All line items sum correctly to the total, and there are no handwritten notes indicating an 'X', so HANDWRITTEN_X is false. Since NOT_TRAVEL_RELATED is violated the receipt needs to be audited.",
7+
"needs_audit": true
8+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,39 @@
1+
{
2+
"merchant": "ARCO GASOLINE",
3+
"location": {
4+
"city": "Vista",
5+
"state": "CA",
6+
"zipcode": null
7+
},
8+
"time": "2023-01-20T08:45:00",
9+
"items": [
10+
{
11+
"description": "E-85",
12+
"product_code": null,
13+
"category": "Fuel",
14+
"item_price": "2.699",
15+
"sale_price": null,
16+
"quantity": "13.268",
17+
"total": "35.81"
18+
},
19+
{
20+
"description": "debitfee",
21+
"product_code": null,
22+
"category": "Fee",
23+
"item_price": null,
24+
"sale_price": null,
25+
"quantity": "1",
26+
"total": "0.35"
27+
}
28+
],
29+
"subtotal": null,
30+
"tax": null,
31+
"total": "36.16",
32+
"handwritten_notes": [
33+
"vista-> yos",
34+
"sequoia",
35+
"yos",
36+
"206618",
37+
"2023"
38+
]
39+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,27 @@
1+
{
2+
"merchant": "Costco #124",
3+
"location": {
4+
"city": "Vista",
5+
"state": "CA",
6+
"zipcode": "92083"
7+
},
8+
"time": "2024-04-09T12:52:00",
9+
"items": [
10+
{
11+
"description": "Regular",
12+
"product_code": null,
13+
"category": "Fuel",
14+
"item_price": "4.959",
15+
"sale_price": "4.959",
16+
"quantity": "10.005",
17+
"total": "49.61"
18+
}
19+
],
20+
"subtotal": "49.61",
21+
"tax": null,
22+
"total": "49.61",
23+
"handwritten_notes": [
24+
"vista",
25+
"219948"
26+
]
27+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,28 @@
1+
{
2+
"merchant": "Fuel Mart",
3+
"location": {
4+
"city": "San Bernardino",
5+
"state": "CA",
6+
"zipcode": "92417"
7+
},
8+
"time": "2024-07-07T17:47:46",
9+
"items": [
10+
{
11+
"description": "REG CR #09",
12+
"product_code": null,
13+
"category": "Fuel",
14+
"item_price": "4.199",
15+
"sale_price": null,
16+
"quantity": "14.507G",
17+
"total": "60.91"
18+
}
19+
],
20+
"subtotal": "60.91",
21+
"tax": null,
22+
"total": "60.91",
23+
"handwritten_notes": [
24+
"224014",
25+
"Nissan",
26+
"X"
27+
]
28+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,28 @@
1+
{
2+
"merchant": "Chukchansi Crossing",
3+
"location": {
4+
"city": "Coarsegold",
5+
"state": "CA",
6+
"zipcode": "93614"
7+
},
8+
"time": "2024-12-18T22:10:05",
9+
"items": [
10+
{
11+
"description": "SUPER",
12+
"product_code": null,
13+
"category": "Fuel",
14+
"item_price": "3.599",
15+
"sale_price": null,
16+
"quantity": "20.032",
17+
"total": "72.10"
18+
}
19+
],
20+
"subtotal": "72.10",
21+
"tax": null,
22+
"total": "72.10",
23+
"handwritten_notes": [
24+
"232658",
25+
"Nissan",
26+
"home -> yos"
27+
]
28+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,54 @@
1+
{
2+
"merchant": "Kohl's",
3+
"location": {
4+
"city": "Oceanside",
5+
"state": "CA",
6+
"zipcode": "92056"
7+
},
8+
"time": "2023-01-12T15:12:00",
9+
"items": [
10+
{
11+
"description": "BATH RUGS",
12+
"product_code": "40076499017",
13+
"category": "Home Goods",
14+
"item_price": "13.99",
15+
"sale_price": "9.79",
16+
"quantity": "1",
17+
"total": "9.79"
18+
},
19+
{
20+
"description": "BATH RUGS",
21+
"product_code": "40076499017",
22+
"category": "Home Goods",
23+
"item_price": "13.99",
24+
"sale_price": "4.89",
25+
"quantity": "1",
26+
"total": "4.89"
27+
},
28+
{
29+
"description": "FLOOR CARE",
30+
"product_code": "62235658793",
31+
"category": "Cleaning Supplies",
32+
"item_price": "329.99",
33+
"sale_price": "209.99",
34+
"quantity": "1",
35+
"total": "209.99"
36+
},
37+
{
38+
"description": "BAKEWARE",
39+
"product_code": "07089662604",
40+
"category": "Kitchenware",
41+
"item_price": "39.99",
42+
"sale_price": "28.00",
43+
"quantity": "1",
44+
"total": "28.00"
45+
}
46+
],
47+
"subtotal": "252.67",
48+
"tax": "20.85",
49+
"total": "273.52",
50+
"handwritten_notes": [
51+
"yos",
52+
"2023"
53+
]
54+
}
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,28 @@
1+
{
2+
"merchant": "Vons",
3+
"location": {
4+
"city": "Oakhurst",
5+
"state": "CA",
6+
"zipcode": "93644"
7+
},
8+
"time": "2024-10-14T20:36:29",
9+
"items": [
10+
{
11+
"description": "10-Unleaded",
12+
"product_code": null,
13+
"category": "Fuel",
14+
"item_price": "4.119",
15+
"sale_price": null,
16+
"quantity": "12.026",
17+
"total": "49.54"
18+
}
19+
],
20+
"subtotal": null,
21+
"tax": null,
22+
"total": "49.54",
23+
"handwritten_notes": [
24+
"home -> Yos",
25+
"Sequoia",
26+
"237407"
27+
]
28+
}

0 commit comments

Comments
 (0)