diff --git a/notebooks/analysis.ipynb b/notebooks/analysis.ipynb new file mode 100644 index 0000000..313290e --- /dev/null +++ b/notebooks/analysis.ipynb @@ -0,0 +1,391 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 15, + "id": "a0dcf44b-c609-4701-8007-b270cf8c3d35", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + " | tcin | \n", + "gtin13 | \n", + "ingestion_time | \n", + "primary_category | \n", + "materials | \n", + "packaging | \n", + "origin | \n", + "weight | \n", + "height | \n", + "width | \n", + "depth | \n", + "ingestion_time | \n", + "material_score | \n", + "weight_score | \n", + "packaging_score | \n", + "origin_score | \n", + "score | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", + "81917300 | \n", + "840391145528 | \n", + "2023-06-25 20:31:00.725924 | \n", + "Toys | \n", + "None | \n", + "1 | \n", + "imported | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "2023-06-25 20:31:00.725924 | \n", + "0.625000 | \n", + "NaN | \n", + "0.6 | \n", + "0.0 | \n", + "NaN | \n", + "
1 | \n", + "84821007 | \n", + "9781801433983 | \n", + "2023-06-25 20:31:00.736690 | \n", + "School & Office Supplies | \n", + "[cardboard] | \n", + "1 | \n", + "imported | \n", + "NaN | \n", + "NaN | \n", + "30.23 | \n", + "NaN | \n", + "2023-06-25 20:31:00.736690 | \n", + "0.253333 | \n", + "NaN | \n", + "0.6 | \n", + "0.0 | \n", + "NaN | \n", + "
2 | \n", + "15432753 | \n", + "883929408115 | \n", + "2023-06-25 20:31:00.742077 | \n", + "Movies, Music & Books | \n", + "None | \n", + "1 | \n", + "usa | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "2023-06-25 20:31:00.742077 | \n", + "NaN | \n", + "NaN | \n", + "0.6 | \n", + "1.0 | \n", + "NaN | \n", + "
3 | \n", + "84199597 | \n", + "194425194489 | \n", + "2023-06-25 20:31:00.746501 | \n", + "Party Supplies | \n", + "[cardboard] | \n", + "24 | \n", + "imported | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "2023-06-25 20:31:00.746501 | \n", + "0.625000 | \n", + "NaN | \n", + "14.4 | \n", + "0.0 | \n", + "NaN | \n", + "
4 | \n", + "86345566 | \n", + "23271231140 | \n", + "2023-06-25 20:31:00.751118 | \n", + "Home | \n", + "[metal] | \n", + "1 | \n", + "imported | \n", + "2109.20 | \n", + "58.42 | \n", + "2.54 | \n", + "58.42 | \n", + "2023-06-25 20:31:00.751118 | \n", + "0.353333 | \n", + "1581.9000 | \n", + "0.6 | \n", + "0.0 | \n", + "1582.853333 | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
162 | \n", + "83388852 | \n", + "4717592035292 | \n", + "2023-06-25 20:31:01.380622 | \n", + "Sports & Outdoors | \n", + "[plastic] | \n", + "1 | \n", + "mixed | \n", + "127.01 | \n", + "NaN | \n", + "12.70 | \n", + "24.13 | \n", + "2023-06-25 20:31:01.380622 | \n", + "0.366667 | \n", + "95.2575 | \n", + "0.6 | \n", + "0.5 | \n", + "96.724167 | \n", + "
163 | \n", + "80836585 | \n", + "841821016982 | \n", + "2023-06-25 20:31:01.384865 | \n", + "Patio & Garden | \n", + "None | \n", + "1 | \n", + "mixed | \n", + "14514.94 | \n", + "30.48 | \n", + "30.48 | \n", + "NaN | \n", + "2023-06-25 20:31:01.384865 | \n", + "0.112500 | \n", + "10886.2050 | \n", + "0.6 | \n", + "0.5 | \n", + "10887.417500 | \n", + "
164 | \n", + "75477923 | \n", + "93422863070 | \n", + "2023-06-25 20:31:01.388505 | \n", + "Holiday Shop | \n", + "[fabric] | \n", + "1 | \n", + "mixed | \n", + "78.64 | \n", + "12.06 | \n", + "5.71 | \n", + "5.71 | \n", + "2023-06-25 20:31:01.388505 | \n", + "0.403571 | \n", + "58.9800 | \n", + "0.6 | \n", + "0.5 | \n", + "60.483571 | \n", + "
165 | \n", + "85634544 | \n", + "194425213968 | \n", + "2023-06-25 20:31:01.391389 | \n", + "Household Essentials | \n", + "None | \n", + "1 | \n", + "imported | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "2023-06-25 20:31:01.391389 | \n", + "NaN | \n", + "NaN | \n", + "0.6 | \n", + "0.0 | \n", + "NaN | \n", + "
166 | \n", + "80239765 | \n", + "724235717129 | \n", + "2023-06-25 20:31:01.394481 | \n", + "Kitchen & Dining | \n", + "[stoneware] | \n", + "1 | \n", + "imported | \n", + "829.60 | \n", + "11.43 | \n", + "31.75 | \n", + "11.43 | \n", + "2023-06-25 20:31:01.394481 | \n", + "NaN | \n", + "622.2000 | \n", + "0.6 | \n", + "0.0 | \n", + "NaN | \n", + "
167 rows × 17 columns
\n", + "