WIP, move split calculation to its own class

Start removal of Gradio and streamlit
2025-01-12 21:50:05 -06:00 · 2025-01-12 20:19:02 -06:00
4 changed files with 949 additions and 866 deletions
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -5,11 +5,11 @@ description = "Add your description here"
 readme = "README.md"
 requires-python = ">=3.11"
 dependencies = [
-    "gradio>=5.9.1",
    "great-tables>=0.15.0",
    "more-itertools>=10.5.0",
    "ollama>=0.4.4",
    "polars>=1.18.0",
+    "reflex>=0.6.8",
    "selenium>=4.27.1",
    "surya-ocr>=0.8.1",
 ]
--- a/src/app/gradio_ui.py
+++ b/src/app/gradio_ui.py
@@ -1,625 +0,0 @@
-from datetime import datetime
-from typing import Literal, TypedDict, TypeVar
-
-import argparse as agp
-import gradio as gr
-import polars as pl
-from PIL.Image import Image
-
-from src.app.split_ai import ReceiptReader
-from src.app.utils import css_code, head_html, spinner_html
-
-ComponentType = TypeVar("ComponentType")
-
-
-def calculate_splits(
-    item_names: list[str],
-    item_people: list[list[str]],
-    item_amounts: list[float],
-    total: float,
-    tip: float,
-    tax: float,
-    people_list: list[str],
-    tip_split_proportionally: bool,
-    tax_split_proportionally: bool,
-    cashback_discount: float,
-    return_detailed_table: bool = False,
-) -> gr.DataFrame:
-    """
-    A simple, but long function to calculate splits for a provided receipt.
-
-    Args:
-        item_names: Names of the items being split.
-        item_people: A list of people for each item who are splitting its cost.
-        item_amounts: Amounts of the items being split.
-        total: The total amount in the receipt
-        tip: The tip in the receipt
-        tax: The tax in the receipt
-        people_list: The total number of people splitting the receipt.
-        tip_split_proportionally: Indicator for whether the tip is split proportional to pre-tax/tip cost.
-        tax_split_proportionally: Indicator for whether the tax is split proportional to pre-tax/tip cost.
-        cashback_discount: The total will be reduced by this percentage value.
-        return_detailed_table: Indicator to return full calculation table or a simplified one.
-
-    Returns:
-        A DataFrame form of the provided values along with their calculated splits or a simplified version.
-    """
-    split_count = 0
-    unsplit_names = []
-    checkbox_count = len(item_people)
-    for name, split in zip(item_names, item_people):
-        if len(split) > 0:
-            split_count += 1
-        else:
-            unsplit_names.append(name)
-    if split_count != checkbox_count:
-        gr.Warning(
-            f"Pending splits: {','.join(unsplit_names)}",
-            title="Can't show splits yet",
-        )
-        return gr.DataFrame(pl.DataFrame(), visible=False)
-    else:
-        # Deliberately avoiding going the numpy route here since the data is very small anyway.
-        split_arrays: list[list[float]] = []
-        for split in item_people:
-            split_array = [1 / len(split) if x in split else 0.0 for x in people_list]
-            split_arrays.append(split_array)
-        split_amounts: list[list[float]] = []
-        for split_array, amount in zip(split_arrays, item_amounts):
-            split_amount = [amount * split for split in split_array]
-            split_amounts.append(split_amount)
-
-        split_subtotals = [sum(x) for x in zip(*split_amounts)]
-        subtotal = total - tip - tax
-        split_tips = [
-            x / subtotal * tip if tip_split_proportionally else tax / len(people_list)
-            for x in split_subtotals
-        ]
-        split_taxes = [
-            x / subtotal * tax if tax_split_proportionally else tax / len(people_list)
-            for x in split_subtotals
-        ]
-        split_totals_pre_cashback = [
-            split_subtotal + split_tip + split_tax
-            for split_subtotal, split_tip, split_tax in zip(
-                split_subtotals, split_tips, split_taxes
-            )
-        ]
-        split_cashback = [-x * cashback_discount for x in split_totals_pre_cashback]
-        split_totals_post_cashback = [
-            x * (1 - cashback_discount) for x in split_totals_pre_cashback
-        ]
-        first_col_names = list(item_names) + [
-            "Subtotal",
-            "Tip",
-            "Tax",
-            "Cashback",
-            "Total",
-        ]
-        splits = split_amounts + [
-            split_subtotals,
-            split_tips,
-            split_taxes,
-            split_cashback,
-            split_totals_post_cashback,
-        ]
-        horizontal_totals = list(item_amounts) + [
-            subtotal,
-            tip,
-            tax,
-            sum(split_cashback),
-            sum(split_totals_post_cashback),
-        ]
-        full_calculation_df = (
-            pl.DataFrame(
-                {
-                    "Item": first_col_names,
-                    "splits": splits,
-                    "Total": horizontal_totals,
-                },
-                schema={
-                    "Item": pl.String,
-                    "splits": pl.List(pl.Float64),
-                    "Total": pl.Float64,
-                },
-            )
-            .with_columns(pl.col("splits").list.to_struct(fields=people_list))
-            .unnest("splits")
-            .with_columns(pl.col(pl.Float64).round(2))
-        )
-        if return_detailed_table:
-            return gr.DataFrame(full_calculation_df, visible=True)
-        else:
-            simple_calculation = (
-                full_calculation_df.filter(pl.col("Item").eq("Total"))
-                .select(pl.exclude("Total"))
-                .transpose(
-                    include_header=True, header_name="Person", column_names=["Split"]
-                )
-                .filter(pl.col("Person").ne("Item"))
-            )
-            return gr.DataFrame(simple_calculation, visible=True)
-
-
-class Item(TypedDict):
-    name: str
-    amount: float
-
-
-class ItemSplitter:
-    def __init__(
-        self,
-        item: Item,
-        people_list: list[str],
-    ) -> None:
-        self.people_list_state = people_list
-        self.item = item
-        self.no_interaction_kwargs = {"interactive": False, "min_width": 10}
-        self.interaction_kwargs = self.no_interaction_kwargs | {
-            "container": False,
-            "interactive": True,
-        }
-
-    def name_textbox(self, item_name: str) -> gr.Textbox:
-        return gr.Textbox(
-            item_name, show_label=False, scale=8, **self.interaction_kwargs
-        )
-
-    def amount_number(self, item_amount: float) -> gr.Number:
-        return gr.Number(
-            value=item_amount, precision=2, scale=3, **self.interaction_kwargs
-        )
-
-    def split_status_button(
-        self, choices: list[str] | None = None, status: Literal["⚠️", "🆗"] = "⚠️"
-    ) -> gr.Button:
-        if choices is not None:
-            if len(choices) == 0:
-                status = "⚠️"
-            else:
-                status = "🆗"
-        else:
-            choices = []
-        variant: Literal["huggingface", "primary"] = (
-            "huggingface" if (status == "⚠️") | (len(choices) == 0) else "primary"
-        )
-        return gr.Button(
-            value=status, variant=variant, scale=1, **self.no_interaction_kwargs
-        )
-
-    def delete_item(self, item_list: list[Item]) -> list[Item]:
-        item_list.remove(self.item)
-        return item_list
-
-    def delete_item_button(self) -> gr.Button:
-        kwargs = self.no_interaction_kwargs | {"interactive": True}
-        return gr.Button(value="❌", variant="stop", **kwargs)
-
-    def people_list_checkbox(self, people_list: list[str]) -> gr.CheckboxGroup:
-        return gr.CheckboxGroup(choices=people_list, **self.interaction_kwargs)
-
-    def generate(self) -> tuple[gr.Textbox, gr.CheckboxGroup, gr.Number, gr.Button]:
-        return self.generate_mobile()
-
-    def generate_mobile(self):
-        with gr.Row(variant="default", equal_height=True):
-            item_name_textbox = self.name_textbox(self.item["name"])
-            item_amount_number = self.amount_number(self.item["amount"])
-            split_status_button = self.split_status_button(status="⚠️")
-            delete_item_button = self.delete_item_button()
-        people_list_checkbox = self.people_list_checkbox(self.people_list_state)
-        people_list_checkbox.change(
-            lambda x: self.split_status_button(choices=x),
-            people_list_checkbox,
-            split_status_button,
-        )
-        return (
-            item_name_textbox,
-            people_list_checkbox,
-            item_amount_number,
-            delete_item_button,
-        )
-
-
-class SplitAIApp:
-    valid_split_variant: Literal["primary"] = "primary"
-    invalid_split_variant: Literal["huggingface"] = "huggingface"
-
-    def __init__(self, llm_model: str):
-        self.receipt_reader = ReceiptReader(llm_model)
-        self.demo = self.create_app()
-
-    @staticmethod
-    def prepare_calculate_splits_kwargs(num_records: int, *all_values) -> gr.DataFrame:
-        """
-        This method is necessary because only a list[gr.Component] or similar can be sent as
-        `inputs` to an event listener. Therefore, it is unpacked here and prepared into a
-        dictionary based on how it is sent by the event. This method is specifically for
-        the `get_split_button.click` event listener.
-
-        Args:
-            num_records: The number of items present to split.
-            *all_values: A list of components to forward to `calculate_splits`.
-
-        Returns:
-            gr.DataFrame
-        """
-        kwargs = {
-            "item_names": all_values[:num_records],
-            "item_people": all_values[num_records : num_records * 2],
-            "item_amounts": all_values[num_records * 2 : num_records * 3],
-        }
-        additional_kwargs = {
-            k: v
-            for k, v in zip(
-                [
-                    "total",
-                    "tip",
-                    "tax",
-                    "people_list",
-                    "tip_split_proportionally",
-                    "tax_split_proportionally",
-                    "cashback_discount",
-                    "return_detailed_table",
-                ],
-                tuple(all_values[num_records * 3 :]),
-            )
-        }
-        additional_kwargs["cashback_discount"] /= 100
-        kwargs.update(additional_kwargs)
-        return calculate_splits(**kwargs)
-
-    @staticmethod
-    def update_component_attributes(
-        component: ComponentType, **kwargs
-    ) -> ComponentType:
-        """
-        This requirement is in place because Gradio expects you to provide A NEW INSTANCE of
-        the component that you want to update with its attributes changed. It seems like it
-        doesn't replace the component, but updates it this way. Very weird behavior.
-
-        Args:
-            component: The gradio component to update attributes for.
-            **kwargs: (attribute, value) pairs to update in child.
-
-        Returns:
-            A new instance of child's class with the updated attributes.
-        """
-        gradio_class = type(component)
-        try:
-            return gradio_class(**kwargs)
-        except Exception as err:
-            print(
-                f"The Gradio component {gradio_class} does not have one of the provided attribute keys."
-            )
-            raise err
-
-    @staticmethod
-    def validate_people_list(people_textbox) -> tuple[gr.Image, list]:
-        if "," in people_textbox and people_textbox[-1] != ",":
-            people_list = [x.strip() for x in people_textbox.split(",")]
-            return gr.Image(interactive=True), people_list
-        else:
-            gr.Warning("You need to enter a list of names separated by commas.")
-            return gr.Image(interactive=False), []
-
-    def create_app(self) -> gr.Blocks():
-        # `head_html` required to prevent iOS from scaling the UI when clicking on a textbox.
-        with gr.Blocks(
-            css=css_code,
-            head=head_html,
-            theme="JohnSmith9982/small_and_pretty",
-            fill_width=True,
-        ) as split_app:
-            with gr.Column():
-                self.people_textbox = gr.Textbox(
-                    placeholder="Split names with a comma",
-                    label="Who all are splitting this receipt?",
-                    lines=1,
-                    autofocus=True,
-                    submit_btn="Submit",
-                )
-                self.people_list = gr.State([])
-                self.image_uploader = gr.Image(
-                    show_label=False, scale=1, type="pil", interactive=False
-                )
-                self.people_textbox.submit(
-                    SplitAIApp.validate_people_list,
-                    [self.people_textbox],
-                    [self.image_uploader, self.people_list],
-                )
-            with gr.Column():
-                with gr.Column():
-                    with gr.Row():
-                        self.merchant = gr.Textbox(
-                            interactive=True,
-                            label="Merchant Name",
-                            min_width=20,
-                            visible=False,
-                            scale=2,
-                        )
-                        self.receipt_date = gr.DateTime(
-                            interactive=True,
-                            include_time=False,
-                            type="datetime",
-                            label="Date",
-                            min_width=20,
-                            visible=False,
-                            scale=1,
-                        )
-                    with gr.Row():
-                        self.total_amount = gr.Number(
-                            interactive=True,
-                            label="Total",
-                            minimum=0,
-                            min_width=20,
-                            visible=False,
-                            precision=2,
-                        )
-                        self.tip_amount = gr.Number(
-                            interactive=True,
-                            label="Tip",
-                            min_width=20,
-                            minimum=0,
-                            visible=False,
-                            precision=2,
-                        )
-                        self.tax_amount = gr.Number(
-                            interactive=True,
-                            label="Tax",
-                            minimum=0,
-                            min_width=20,
-                            visible=False,
-                            precision=2,
-                        )
-                self.items = gr.State([])
-
-                @gr.render(inputs=[self.items, self.people_list])
-                def render_items(items: list[Item], people_list: list[str]):
-                    item_names = []
-                    item_peoples = []
-                    item_amounts = []
-                    for key, item in enumerate(items):
-                        with gr.Column(variant="compact"):
-                            splitter = ItemSplitter(item, people_list)
-                            item_name, item_people, item_amount, delete_item_button = (
-                                splitter.generate()
-                            )
-                            # This event needs to be defined outside the ItemSplitter class
-                            # because it references a gr.State variable. All Gradio components
-                            # can be properly pass ONLY via event listeners, as their state is
-                            # managed by Gradio outside the flow of the Python app.
-                            delete_item_button.click(
-                                splitter.delete_item, self.items, self.items
-                            )
-                            item_names.append(item_name)
-                            item_peoples.append(item_people)
-                            item_amounts.append(item_amount)
-
-                    self.split_tip_proportionally = gr.Checkbox(
-                        value=True,
-                        label="Split tip proportional to other costs",
-                        info="If unchecked, will split equally.",
-                        interactive=True,
-                    )
-                    self.split_tax_proportionally = gr.Checkbox(
-                        value=True,
-                        label="Split tax proportional to other costs",
-                        info="If unchecked, will split equally.",
-                        interactive=True,
-                    )
-                    self.add_cashback_discount = gr.Number(
-                        minimum=0,
-                        maximum=100,
-                        value=0,
-                        step=0.5,
-                        label="Cashback discount to apply on total",
-                        info="Choose a number between 0% and 100%.",
-                        interactive=True,
-                    )
-                    self.show_detailed_table = gr.Checkbox(
-                        value=False,
-                        label="Show a detailed calculation table",
-                        info="If unchecked, will just show the splits.",
-                        interactive=True,
-                    )
-
-                    with gr.Row():
-                        self.integrity_markdown = gr.Markdown(
-                            show_label=False, value="", visible=False
-                        )
-
-                    with gr.Row():
-                        get_splits_button = gr.Button(
-                            "Get Splits", variant="primary", scale=5, min_width=10
-                        )
-                        get_splits_button.click(
-                            lambda *x: SplitAIApp.prepare_calculate_splits_kwargs(
-                                len(item_names), *x
-                            ),
-                            inputs=(
-                                item_names
-                                + item_peoples
-                                + item_amounts
-                                + [
-                                    self.total_amount,
-                                    self.tip_amount,
-                                    self.tax_amount,
-                                    self.people_list,
-                                    self.split_tip_proportionally,
-                                    self.split_tax_proportionally,
-                                    self.add_cashback_discount,
-                                    self.show_detailed_table,
-                                ]
-                            ),
-                            outputs=self.display_result,
-                        )
-
-                        add_item_button = gr.Button(
-                            "➕", variant="secondary", scale=1, min_width=10
-                        )
-
-                        def add_item(
-                            items: list[Item],
-                        ):
-                            new_item_name = f"Item {len(items)+1}"
-                            return items + [
-                                {
-                                    "name": new_item_name,
-                                    "amount": 0.0,
-                                }
-                            ]
-
-                        add_item_button.click(
-                            add_item,
-                            inputs=[self.items],
-                            outputs=[self.items],
-                        )
-
-                    # Constantly keep track of whether totals match or not.
-                    def integrity_checker(*args) -> gr.Markdown:
-                        items = args[: len(args) - 3]
-                        tip_amount, tax_amount, total_amount = args[len(args) - 3 :]
-                        subtotal = sum(items)
-                        if subtotal + tip_amount + tax_amount != total_amount:
-                            return gr.Markdown(
-                                f"⚠️ Looks like the total ({total_amount}) doesn't match the value of subtotal ({subtotal}) + tip ({tip_amount}) + tax ({tax_amount}) ⚠️",
-                                show_label=False,
-                                visible=True,
-                            )
-                        else:
-                            return gr.Markdown(visible=False)
-
-                    gr.on(
-                        triggers=[x.change for x in item_amounts]
-                        + [
-                            self.tip_amount.change,
-                            self.tax_amount.change,
-                            self.total_amount.change,
-                        ],
-                        fn=integrity_checker,
-                        inputs=item_amounts
-                        + [
-                            self.tip_amount,
-                            self.tax_amount,
-                            self.total_amount,
-                        ],
-                        outputs=[self.integrity_markdown],
-                    )
-
-            self.display_result = gr.DataFrame(value=None, visible=False)
-
-            self.spinner_html = gr.HTML(
-                spinner_html,
-                visible=False,
-                padding=False,
-            )
-
-            self.image_uploader.upload(
-                lambda: gr.HTML(visible=True), inputs=None, outputs=self.spinner_html
-            ).then(
-                self.process_image,
-                inputs=[self.image_uploader, self.items],
-                outputs=[
-                    self.merchant,
-                    self.receipt_date,
-                    self.total_amount,
-                    self.tip_amount,
-                    self.tax_amount,
-                    self.items,
-                ],
-                show_progress="hidden",
-            ).then(
-                lambda: gr.HTML(visible=False), inputs=None, outputs=self.spinner_html
-            )
-
-        return split_app
-
-    def process_image(
-        self,
-        image: Image,
-        items: gr.State,
-    ):  # -> gr.State:
-        receipt_string = self.receipt_reader.get_ordered_text(image)
-        receipt_extracted = self.receipt_reader.extract_components(receipt_string)
-        print(receipt_extracted)
-        # receipt_extracted = {
-        #     "merchant": "FUBAR",
-        #     "receipt_date": datetime.now(),
-        #     "total": 15,
-        #     "tip": 0,
-        #     "tax": 3,
-        #     "item_amounts": [
-        #         {"name": "PET TOY", "currency": "$", "amount": 2},
-        #         {"name": "FLOPPY PUPPY", "currency": "$", "amount": 4},
-        #         {"name": "SSSUPREME S", "currency": "$", "amount": 6},
-        #     ],
-        # }
-        key_value_updates = [
-            {
-                "component": self.merchant,
-                "kwargs": {"value": receipt_extracted["merchant"], "visible": True},
-            },
-            {
-                "component": self.receipt_date,
-                "kwargs": {
-                    "value": receipt_extracted["receipt_date"],
-                    "visible": True,
-                },
-            },
-            {
-                "component": self.total_amount,
-                "kwargs": {
-                    "value": receipt_extracted["total"],
-                    "visible": True,
-                },
-            },
-            {
-                "component": self.tip_amount,
-                "kwargs": {
-                    "value": receipt_extracted["tip"],
-                    "visible": True,
-                },
-            },
-            {
-                "component": self.tax_amount,
-                "kwargs": {
-                    "value": receipt_extracted["tax"],
-                    "visible": True,
-                },
-            },
-        ]
-        out = [
-            self.update_component_attributes(x["component"], **x["kwargs"])
-            for x in key_value_updates
-        ]
-        items += [
-            {"name": x["name"], "amount": x["amount"]}
-            for x in receipt_extracted["receipt_items"]
-        ]
-        out += [items]
-        return out
-
-    def launch(self, expose_to_local_network: bool = False):
-        if expose_to_local_network:
-            self.demo.queue().launch(server_name="0.0.0.0", server_port=7860)
-        else:
-            self.demo.queue().launch()
-
-
-def arg_parser() -> agp.ArgumentParser:
-    ag = agp.ArgumentParser()
-    ag.add_argument(
-        "-m",
-        "--model",
-        type=str,
-        default="qwen2.5:7b",
-        help="Choose the LLM model used.",
-    )
-    return ag
-
-
-if __name__ == "__main__":
-    args = arg_parser().parse_args()
-    demo = SplitAIApp(args.model)
-    demo.launch(True)
--- a/src/core/split.py
+++ b/src/core/split.py
@@ -0,0 +1,275 @@
+import polars as pl
+
+
+class IncompleteSplitError(Exception):
+    def __init__(
+        self,
+        message,
+    ):
+        super().__init__(message)
+
+
+class SplitCalculator:
+    """
+    A simple, but long class to calculate splits for a provided receipt.
+
+    Args:
+        item_names: Names of the items being split.
+        item_people: A list of people for each item who are splitting its cost.
+        item_amounts: Amounts of the items being split.
+        total: The total amount in the receipt
+        tip: The tip in the receipt
+        tax: The tax in the receipt
+        people_list: The total number of people splitting the receipt.
+        tip_split_proportionally: Indicator for whether the tip is split proportional to pre-tax/tip cost.
+        tax_split_proportionally: Indicator for whether the tax is split proportional to pre-tax/tip cost.
+        cashback_discount: The total will be reduced by this percentage value.
+        return_detailed_table: Indicator to return full calculation table or a simplified one.
+    """
+
+    def __init__(
+        self,
+        item_names: list[str],
+        item_people: list[list[str]],
+        item_amounts: list[float],
+        receipt_total: float,
+        receipt_tip: float,
+        receipt_tax: float,
+        people_list: list[str],
+        tip_split_proportionally: bool,
+        tax_split_proportionally: bool,
+        cashback_discount: float,
+        return_detailed_table: bool = False,
+    ):
+        self.item_names = item_names
+        self.item_people = item_people
+        self.item_amounts = item_amounts
+        self.receipt_total = receipt_total
+        self.receipt_tip = receipt_tip
+        self.receipt_tax = receipt_tax
+        self.people_list = people_list
+        self.tip_split_proportionally = tip_split_proportionally
+        self.tax_split_proportionally = tax_split_proportionally
+        self.cashback_discount = cashback_discount
+        self.return_detailed_table = return_detailed_table
+
+        self.subtotal = self.receipt_total - self.receipt_tip - self.receipt_tax
+        self.split_tips: float | None = None
+        self.split_taxes: float | None = None
+
+    def validate_splits(self):
+        split_count = 0
+        unsplit_names = []
+        for name, split in zip(self.item_names, self.item_people):
+            if len(split) > 0:
+                split_count += 1
+            else:
+                unsplit_names.append(name)
+        if split_count != len(self.item_people):
+            raise IncompleteSplitError(
+                f"The following items have not been assigned splits: {','.join(unsplit_names)}"
+            )
+
+    def distribute_amount(self, amount: float, split_subtotals: list[float]):
+        """
+        Distribute `amount` equally, or distribute it proportionally, among
+        all the people involved in the split.
+        """
+        return [
+            x / self.subtotal * amount
+            if self.tax_split_proportionally
+            else amount / len(self.people_list)
+            for x in split_subtotals
+        ]
+
+    def subtract_cashback(
+        self, split_totals: list[float]
+    ) -> tuple[list[float], list[float]]:
+        split_cashback = [-x * cashback_discount for x in split_totals]
+        split_totals_minus_cashback = [
+            x * (1 - cashback_discount) for x in split_totals
+        ]
+        return split_cashback, split_totals_minus_cashback
+
+    def forward(self):
+        split_arrays: list[list[float]] = []
+        for split in self.item_people:
+            split_array = [
+                1 / len(split) if x in split else 0.0 for x in self.people_list
+            ]
+            split_arrays.append(split_array)
+        split_amounts: list[list[float]] = []
+        for split_array, amount in zip(split_arrays, self.item_amounts):
+            split_amount = [amount * split for split in split_array]
+            split_amounts.append(split_amount)
+
+        split_subtotals = [sum(x) for x in zip(*split_amounts)]
+        split_tips = self.distribute_amount(self.receipt_tip, split_subtotals)
+        split_taxes = self.distribute_amount(self.receipt_tax, split_subtotals)
+
+        split_totals = [
+            split_subtotal + split_tip + split_tax
+            for split_subtotal, split_tip, split_tax in zip(
+                split_subtotals, split_tips, split_taxes
+            )
+        ]
+        split_cashback, split_totals_minus_cashback = self.subtract_cashback(
+            split_totals
+        )
+
+
+def calculate_splits(
+    item_names: list[str],
+    item_people: list[list[str]],
+    item_amounts: list[float],
+    total: float,
+    tip: float,
+    tax: float,
+    people_list: list[str],
+    tip_split_proportionally: bool,
+    tax_split_proportionally: bool,
+    cashback_discount: float,
+    return_detailed_table: bool = False,
+) -> pl.DataFrame:
+    """
+    A simple, but long function to calculate splits for a provided receipt.
+
+    Args:
+        item_names: Names of the items being split.
+        item_people: A list of people for each item who are splitting its cost.
+        item_amounts: Amounts of the items being split.
+        total: The total amount in the receipt
+        tip: The tip in the receipt
+        tax: The tax in the receipt
+        people_list: The total number of people splitting the receipt.
+        tip_split_proportionally: Indicator for whether the tip is split proportional to pre-tax/tip cost.
+        tax_split_proportionally: Indicator for whether the tax is split proportional to pre-tax/tip cost.
+        cashback_discount: The total will be reduced by this percentage value.
+        return_detailed_table: Indicator to return full calculation table or a simplified one.
+
+    Returns:
+        A DataFrame form of the provided values along with their calculated splits or a simplified version.
+    """
+    split_count = 0
+    unsplit_names = []
+    checkbox_count = len(item_people)
+    for name, split in zip(item_names, item_people):
+        if len(split) > 0:
+            split_count += 1
+        else:
+            unsplit_names.append(name)
+    if split_count != checkbox_count:
+        raise IncompleteSplitError(
+            f"The following items have not been assigned splits: {','.join(unsplit_names)}"
+        )
+        return None
+    else:
+        # Deliberately avoiding going the numpy route here since the data is very small anyway.
+        split_arrays: list[list[float]] = []
+        for split in item_people:
+            split_array = [1 / len(split) if x in split else 0.0 for x in people_list]
+            split_arrays.append(split_array)
+        split_amounts: list[list[float]] = []
+        for split_array, amount in zip(split_arrays, item_amounts):
+            split_amount = [amount * split for split in split_array]
+            split_amounts.append(split_amount)
+
+        split_subtotals = [sum(x) for x in zip(*split_amounts)]
+        subtotal = total - tip - tax
+        split_tips = [
+            x / subtotal * tip if tip_split_proportionally else tax / len(people_list)
+            for x in split_subtotals
+        ]
+        split_taxes = [
+            x / subtotal * tax if tax_split_proportionally else tax / len(people_list)
+            for x in split_subtotals
+        ]
+        split_totals_pre_cashback = [
+            split_subtotal + split_tip + split_tax
+            for split_subtotal, split_tip, split_tax in zip(
+                split_subtotals, split_tips, split_taxes
+            )
+        ]
+        split_cashback = [-x * cashback_discount for x in split_totals_pre_cashback]
+        split_totals_post_cashback = [
+            x * (1 - cashback_discount) for x in split_totals_pre_cashback
+        ]
+        first_col_names = list(item_names) + [
+            "Subtotal",
+            "Tip",
+            "Tax",
+            "Cashback",
+            "Total",
+        ]
+        splits = split_amounts + [
+            split_subtotals,
+            split_tips,
+            split_taxes,
+            split_cashback,
+            split_totals_post_cashback,
+        ]
+        horizontal_totals = list(item_amounts) + [
+            subtotal,
+            tip,
+            tax,
+            sum(split_cashback),
+            sum(split_totals_post_cashback),
+        ]
+        full_calculation_df = (
+            pl.DataFrame(
+                {
+                    "Item": first_col_names,
+                    "splits": splits,
+                    "Total": horizontal_totals,
+                },
+                schema={
+                    "Item": pl.String,
+                    "splits": pl.List(pl.Float64),
+                    "Total": pl.Float64,
+                },
+            )
+            .with_columns(pl.col("splits").list.to_struct(fields=people_list))
+            .unnest("splits")
+            .with_columns(pl.col(pl.Float64).round(2))
+        )
+        if return_detailed_table:
+            return full_calculation_df
+        else:
+            simple_calculation = (
+                full_calculation_df.filter(pl.col("Item").eq("Total"))
+                .select(pl.exclude("Total"))
+                .transpose(
+                    include_header=True, header_name="Person", column_names=["Split"]
+                )
+                .filter(pl.col("Person").ne("Item"))
+            )
+            return simple_calculation
+
+
+if __name__ == "__main__":
+    # Example usage
+    item_names = ["Item 1", "Item 2", "Item 3"]
+    item_people = [["Alice", "Bob"], ["Alice"], ["Bob", "Charlie"]]
+    item_amounts = [10.0, 20.0, 30.0]
+    total = 70.0
+    tip = 6.0
+    tax = 4.0
+    people_list = ["Alice", "Bob", "Charlie"]
+    tip_split_proportionally = True
+    tax_split_proportionally = True
+    cashback_discount = 0.03
+
+    result_df = calculate_splits(
+        item_names,
+        item_people,
+        item_amounts,
+        total,
+        tip,
+        tax,
+        people_list,
+        tip_split_proportionally,
+        tax_split_proportionally,
+        cashback_discount,
+        return_detailed_table=True,
+    )
+    print(result_df)
--- a/uv.lock
+++ b/uv.lock
Author	SHA1	Message	Date
Avinash Mallya	ce147d0e08	WIP, move split calculation to its own class	2025-01-12 21:50:05 -06:00
Avinash Mallya	a86f856ec4	Start removal of Gradio and streamlit	2025-01-12 20:19:02 -06:00