In [4]:
import json
import pandas as pd

def process_data_in_chunks(file_path, chunk_size=10000):
    # This list will hold the current chunk of data
    chunk_data = []
    
    with open(file_path, 'r') as file:
        for i, line in enumerate(file):
            try:
                # Parse JSON data
                json_data = json.loads(line)
                chunk_data.append(json_data)
                
                # If the current chunk size reaches the chunk_size or end of file
                if len(chunk_data) >= chunk_size:
                    yield pd.DataFrame(chunk_data)
                    chunk_data = []  # Reset for the next chunk
            except json.JSONDecodeError:
                print(f"Error: Invalid JSON format on line {i}")
    
    # Yield any remaining data as the last chunk
    if chunk_data:
        yield pd.DataFrame(chunk_data)

# Example of how to use this function
for df_chunk in process_data_in_chunks('Sampled_Amazon_Meta.json'):
    print(df_chunk.head())  # Process each chunk, e.g., print, analyze, or save


                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Men, Clothing, Jea...         
1  [Clothing, Shoes & Jewelry, Women, Accessories...         
2  [Clothing, Shoes & Jewelry, Women, Clothing, L...         
3  [Clothing, Shoes & Jewelry, Women, Clothing, D...         
4  [Clothing, Shoes & Jewelry, Women, Clothing, L...         

                                         description  \
0  [<b>pant size(Unit:inch)</b><br> W30(tag30) Wa...   
1  [Feature <br> -Great quality winter scarf. <br...   
2  [Material : Core-spun fabric silk <br> feature...   
3  [Material : Core-spun fabric silk <br> feature...   
4  [Material : Core-spun fabric silk <br> feature...   

                                                 fit  \
0   class="a-normal a-align-center a-spacing-smal...   
1                                                      
2   class="a-normal a-align-center a-spacing-smal...   
3   class="a-normal a-align-center a-spacing-smal...   
4         

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Women, Jewelry, Br...         
1  [Clothing, Shoes & Jewelry, Women, Jewelry, Br...         
2  [Clothing, Shoes & Jewelry, Women, Jewelry, Br...         
3  [Clothing, Shoes & Jewelry, Women, Jewelry, Br...         
4  [Clothing, Shoes & Jewelry, Women, Jewelry, Br...         

                                         description  \
0                                                 []   
1  [, An amazing work of art! This cicada bug is ...   
2  [There's a serene expression on the maiden's f...   
3  [This trusty steed will be perfect for any hor...   
4  [Like a moth drawn to a light, we are totally ...   

                                                 fit  \
0   class="a-normal a-align-center a-spacing-smal...   
1                                                      
2                                                      
3                                                      
4         

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Women, Jewelry, Ea...         
1  [Clothing, Shoes & Jewelry, Men, Jewelry, Ring...         
2  [Clothing, Shoes & Jewelry, Novelty & More, Cl...         
3  [Clothing, Shoes & Jewelry, Men, Surf, Skate &...         
4  [Clothing, Shoes & Jewelry, Women, Clothing, A...         

                                         description  \
0                                                 []   
1  [Solid Sterling Silver "LOVE, LOYALTY, FRIENDS...   
2                                                 []   
3  [A classic of years past and for years to come...   
4  [One of Soffe's classics juniors shorts in a n...   

                                                 fit  \
0                                                      
1                                                      
2                                                      
3   class="a-normal a-align-center a-spacing-smal...   
4   class=

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Shoe, Jewelry & Wa...         
1  [Clothing, Shoes & Jewelry, Shoe, Jewelry & Wa...         
2  [Clothing, Shoes & Jewelry, Shoe, Jewelry & Wa...         
3  [Clothing, Shoes & Jewelry, Shoe, Jewelry & Wa...         
4  [Clothing, Shoes & Jewelry, Shoe, Jewelry & Wa...         

                                         description  \
0  [The Fashion Shoelaces series are made exclusi...   
1  [These Shoe Laces are 100% Cotton Shoelaces. F...   
2  [These Heavy Duty ROUND Boot Laces are a great...   
3  [The Fashion Shoelaces series are made exclusi...   
4  [These shoelaces come in a variety of colors a...   

                                                 fit  \
0   class="a-normal a-align-center a-spacing-smal...   
1   class="a-normal a-align-center a-spacing-smal...   
2   class="a-normal a-align-center a-spacing-smal...   
3   class="a-normal a-align-center a-spacing-smal...   
4   class=

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Novelty & More, Cl...         
1  [Clothing, Shoes & Jewelry, Women, Jewelry, Ri...         
2  [Clothing, Shoes & Jewelry, Women, Jewelry, Ri...         
3  [Clothing, Shoes & Jewelry, Novelty & More, Cl...         
4  [Clothing, Shoes & Jewelry, Women, Jewelry, Ri...         

                                         description  \
0                                                 []   
1  [This piece of jewelry would be a wonderful ad...   
2  [This piece of jewelry would be a wonderful ad...   
3  [Lace fishnet halter garter dress with opaque ...   
4  [This piece of jewelry would be a wonderful ad...   

                                                 fit  \
0                                                      
1                                                      
2                                                      
3   class="a-normal a-align-center a-spacing-smal...   
4         

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Women, Handbags & ...         
1  [Clothing, Shoes & Jewelry, Women, Jewelry, Ne...         
2  [Clothing, Shoes & Jewelry, Women, Watches, Wr...         
3  [Clothing, Shoes & Jewelry, Women, Jewelry, Ea...         
4  [Clothing, Shoes & Jewelry, Women, Clothing, S...         

                                         description fit  \
0  [Out of Print pouch bag with a Edgar Allen Poe...       
1  [This is our Flagship Firefighter Charm inlaid...       
2  [Pulsar, Night Out, Women's Watch, Stainless S...       
3                                                 []       
4  [Suprisingly functional, supremely attractive ...       

                                               title  \
0                     Out of Print Poe-ka Dots Pouch   
1  Firefighter Fireman Shield Clear Crystal Red E...   
2  Pulsar Women's PP6106 Analog Display Japanese ...   
3  WithLoveSilver 925 Sterling Silver Teen

                                            category tech1  \
0   [Clothing, Shoes & Jewelry, Women, Shoes, Flats]         
1  [Clothing, Shoes & Jewelry, Men, Shoes, Boots,...         
2  [Clothing, Shoes & Jewelry, Men, Accessories, ...         
3  [Clothing, Shoes & Jewelry, Women, Jewelry, Ne...         
4  [Clothing, Shoes & Jewelry, Women, Jewelry, Ne...         

                                         description  \
0                                                 []   
1  [Rugged style and reliability wrap up in the m...   
2  [, <b>Polarized Lens Replacement Compatible wi...   
3  [, <strong>Immerse Yourself In The Chic Elegan...   
4                                                 []   

                                                 fit  \
0                                                      
1   class="a-normal a-align-center a-spacing-smal...   
2                                                      
3                                                      
4         

                                            category tech1  \
0                 [Clothing, Shoes & Jewelry, Women]         
1  [Clothing, Shoes & Jewelry, Men, Jewelry, Earr...         
2  [Clothing, Shoes & Jewelry, Men, Jewelry, Earr...         
3  [Clothing, Shoes & Jewelry, Men, Shoes, Loafer...         
4  [Clothing, Shoes & Jewelry, Men, Jewelry, Earr...         

                                         description  \
0  [*Color 01<br>*Condition: 100% brand new<br>*C...   
1  [*Style 01<br>*Condition: 100% brand new<br>*C...   
2  [*Condition: 100% brand new <br /> *Material: ...   
3  [The Keen Men's Portsmouth Shoes keep your fee...   
4  [*Condition: 100% brand new<br>*Code: ME-30F<b...   

                                                 fit  \
0                                                      
1                                                      
2                                                      
3   class="a-normal a-align-center a-spacing-smal...   
4         

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Women, Shoes, Leat...         
1  [Clothing, Shoes & Jewelry, Women, Shoes, Leat...         
2  [Clothing, Shoes & Jewelry, Women, Shoes, Leat...         
3  [Clothing, Shoes & Jewelry, Women, Shoes, Leat...         
4  [Clothing, Shoes & Jewelry, Novelty & More, Cl...         

                                         description  \
0  [L'Arstiste by Spring Step Santorini is a hand...   
1  [L'Arstiste by Spring Step Santorini is a hand...   
2  [L'Arstiste by Spring Step Santorini is a hand...   
3  [L'Arstiste by Spring Step Santorini is a hand...   
4  [Black Beanie/Pentagram Logo - Have Your Favor...   

                                                 fit  \
0   class="a-normal a-align-center a-spacing-smal...   
1   class="a-normal a-align-center a-spacing-smal...   
2   class="a-normal a-align-center a-spacing-smal...   
3   class="a-normal a-align-center a-spacing-smal...   
4         

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Men, Watches, Watc...         
1  [Clothing, Shoes & Jewelry, Men, Uniforms, Wor...         
2  [Clothing, Shoes & Jewelry, Women, Jewelry, Ne...         
3  [Clothing, Shoes & Jewelry, Men, Jewelry, Neck...         
4   [Clothing, Shoes & Jewelry, Girls, Shoes, Flats]         

                                         description  \
0                                                 []   
1  [Work environments can be unpredictable, but t...   
2  [Very comfortable, very stylish. Great quality...   
3  [Very comfortable, very stylish. Great quality...   
4              [Girls Sporty Mary Jane With Sequins]   

                                                 fit  \
0   class="a-normal a-align-center a-spacing-smal...   
1   class="a-normal a-align-center a-spacing-smal...   
2                                                      
3                                                      
4   class=

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Novelty & More, Cl...         
1  [Clothing, Shoes & Jewelry, Novelty & More, Cl...         
2  [Clothing, Shoes & Jewelry, Novelty & More, Cl...         
3  [Clothing, Shoes & Jewelry, Novelty & More, Cl...         
4  [Clothing, Shoes & Jewelry, Novelty & More, Cl...         

                                         description  \
0                                                 []   
1  [Ripple Junction Officially Licensed Firefly T...   
2  [Ripple Junction Officially Licensed Gintama T...   
3  [Buddy the Elf knows how exciting it can be to...   
4  [Smiling is Buddy the Elfs favorite. Not only ...   

                                                 fit  \
0   class="a-normal a-align-center a-spacing-smal...   
1                                                      
2                                                      
3   class="a-normal a-align-center a-spacing-smal...   
4   class=

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Women, Shoes, Sand...         
1          [Clothing, Shoes & Jewelry, Women, Shoes]         
2  [Clothing, Shoes & Jewelry, Men, Shoes, Athlet...         
3  [Clothing, Shoes & Jewelry, Women, Shoes, Sand...         
4  [Clothing, Shoes & Jewelry, Men, Shoes, Athlet...         

                                         description  \
0  [Your peers will take notice of your style whe...   
1  [Smart and stylish, Ambers four straps adjust ...   
2  [Dedicated XC, Cyclo-Cross no compromise racin...   
3  [The Dwyn's faux wood grain wedge takes a wear...   
4  [Dedicated XC, Cyclo-Cross no compromise racin...   

                                                 fit  \
0   class="a-normal a-align-center a-spacing-smal...   
1   class="a-normal a-align-center a-spacing-smal...   
2                                                      
3   class="a-normal a-align-center a-spacing-smal...   
4         

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Women, Jewelry, Je...         
1  [Clothing, Shoes & Jewelry, Women, Clothing, D...         
2  [Clothing, Shoes & Jewelry, Women, Clothing, D...         
3  [Clothing, Shoes & Jewelry, Women, Handbags & ...         
4   [Clothing, Shoes & Jewelry, Men, Shoes, Sandals]         

                                         description  \
0                    [Package Include: \n<br> 1 set]   
1                                                 []   
2                                                 []   
3                                                 []   
4  [Timeless slide sandal style merges with our o...   

                                                 fit  \
0                                                      
1   class="a-normal a-align-center a-spacing-smal...   
2                                                      
3                                                      
4   class=

                                            category tech1  \
0       [Clothing, Shoes & Jewelry, Girls, Clothing]         
1  [Clothing, Shoes & Jewelry, Men, Clothing, Act...         
2  [Clothing, Shoes & Jewelry, Luggage & Travel G...         
3                 [Clothing, Shoes & Jewelry, Women]         
4  [Clothing, Shoes & Jewelry, Men, Clothing, Act...         

                                         description  \
0  [eTree Girls' double layers, pants with skirts...   
1                                                 []   
2  [Available in a wide range of color combinatio...   
3                                                 []   
4                                                 []   

                                                 fit  \
0   class="a-normal a-align-center a-spacing-smal...   
1   class="a-normal a-align-center a-spacing-smal...   
2                                                      
3   class="a-normal a-align-center a-spacing-smal...   
4   class=

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Men, Accessories, ...         
1  [Clothing, Shoes & Jewelry, Men, Jewelry, Body...         
2  [Clothing, Shoes & Jewelry, Women, Accessories...         
3  [Clothing, Shoes & Jewelry, Women, Clothing, S...         
4  [Clothing, Shoes & Jewelry, Women, This fashio...         

                                         description  \
0                                                 []   
1  [You are buying 2 Pieces (One Pair) of 14G(1.6...   
2                                                 []   
3  [DJT Womens Long Sleeve Knit Sweater Dress Siz...   
4  [<b>Women's Princess Renaissance Corset Floral...   

                                                 fit  \
0   class="a-normal a-align-center a-spacing-smal...   
1                                                      
2                                                      
3   class="a-normal a-align-center a-spacing-smal...   
4   class=

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Men, Shoes, Imported]         
1  [Clothing, Shoes & Jewelry, Men, Shoes, Imported]         
2  [Clothing, Shoes & Jewelry, Women, Shoes, Fash...         
3  [Clothing, Shoes & Jewelry, Men, Shoes, Oxford...         
4  [Clothing, Shoes & Jewelry, Men, Shoes, Imported]         

                                         description  \
0                                                 []   
1                                                 []   
2                                  [Fashion sneaker]   
3  [Our Story: Conal International Trading Incorp...   
4                                                 []   

                                                 fit  \
0                                                      
1   class="a-normal a-align-center a-spacing-smal...   
2   class="a-normal a-align-center a-spacing-smal...   
3   class="a-normal a-align-center a-spacing-smal...   
4   class=

                                            category tech1 description  \
0       [Clothing, Shoes & Jewelry, Girls, Clothing]                []   
1  [Clothing, Shoes & Jewelry, Baby, Baby Boys, C...                []   
2  [Clothing, Shoes & Jewelry, Boys, Clothing, Sl...                []   
3  [Clothing, Shoes & Jewelry, Baby, Baby Girls, ...                []   
4  [Clothing, Shoes & Jewelry, Men, Clothing, Shi...                []   

                                                 fit  \
0                                                      
1   class="a-normal a-align-center a-spacing-smal...   
2   class="a-normal a-align-center a-spacing-smal...   
3   class="a-normal a-align-center a-spacing-smal...   
4   class="a-normal a-align-center a-spacing-smal...   

                                               title  \
0         Carter's Girls' 2 Pc Playwear Sets 259g141   
1     Carter's Baby Boys' 2 Pc Playwear Sets 229g132   
2                 Carter's Boys' 4 Pc Cotton 341g0

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Women, Shoes, Boot...         
1  [Clothing, Shoes & Jewelry, Women, Clothing, J...         
2  [Clothing, Shoes & Jewelry, Novelty & More, Cl...         
3  [Clothing, Shoes & Jewelry, Women, Shoes, 100%...         
4  [Clothing, Shoes & Jewelry, Women, Shoes, Sand...         

                                         description  \
0  [Cute unlined bootie, Jessica Simpson is famou...   
1  [Five pocket skinny-straight leg pant with bac...   
2  [Waist Up Brendon Wearing Red Jacket Against B...   
3  [Dressy pump, Jessica Simpson is famous for he...   
4  [Sexy platform sandal, Jessica Simpson is famo...   

                                                 fit  \
0   class="a-normal a-align-center a-spacing-smal...   
1   class="a-normal a-align-center a-spacing-smal...   
2   class="a-normal a-align-center a-spacing-smal...   
3   class="a-normal a-align-center a-spacing-smal...   
4   class=

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Women, Clothing, S...         
1  [Clothing, Shoes & Jewelry, Women, Clothing, D...         
2  [Clothing, Shoes & Jewelry, Women, Clothing, D...         
3  [Clothing, Shoes & Jewelry, Luggage & Travel G...         
4  [Clothing, Shoes & Jewelry, Luggage & Travel G...         

                                         description  \
0  [<br>Size chart: <br>S/US 0-2: Bust: 32.5-33.5...   
1  [, attention, although this dress has stretchy...   
2                                                 []   
3  [ThiKin Backpack Features: <br> - Mainly made ...   
4                                                 []   

                                                 fit  \
0   class="a-normal a-align-center a-spacing-smal...   
1                                                      
2   class="a-normal a-align-center a-spacing-smal...   
3                                                      
4         

                                            category tech1  \
0  [Clothing, Shoes & Jewelry, Women, Shoes, Pump...         
1  [Clothing, Shoes & Jewelry, Women, A pattern w...         
2  [Clothing, Shoes & Jewelry, Women, Jewelry, Ea...         
3  [Clothing, Shoes & Jewelry, Men, Accessories, ...         
4  [Clothing, Shoes & Jewelry, Men, Surf, Skate &...         

                                         description fit  \
0  [</br> </br> </br><b>MONICOCO is a global bran...       
1  [The owner of "tanezo.jp" shop is a native Jap...       
2                                                 []       
3  [Complement any outfit with this smooth leathe...       
4  [Special features include: polar fleece shirt....       

                                               title  \
0  MONICOCO Women's Stilettos Studded T-Strap Pum...   
1  T2C American Flag Long Maxi Dress Women's USA ...   
2  SELOVO Teardrop Drop Dangle Earrings Silver To...   
3  Nautica Men's Reversible Dress Belt wit

                                            category tech1  \
0  [Home & Kitchen, Kitchen & Dining, Dining & En...         
1  [Home & Kitchen, Heating, Cooling & Air Qualit...         
2  [Home & Kitchen, Heating, Cooling & Air Qualit...         
3  [Home & Kitchen, Heating, Cooling & Air Qualit...         
4  [Home & Kitchen, Kitchen & Dining, Cookware, R...         

                                         description fit  \
0  [032677493267 Features: -Fluted pattern. -Dish...       
1  [For 2.7 Gallon Output Cool Mist Humidifiers. ...       
2  [This HEPA Filter is the fast and easy-to-repl...       
3  [This HEPA Filter is the fast and easy-to-repl...       
4  [, Americas favorite roaster! Granite Ware Roa...       

                                               title  \
0     Wedgwood Night &amp; Day Bone China Fluted Mug   
1  Hamilton Beach 05910 TrueAir Cool Mist Humidif...   
2  Hamilton Beach 04912 TrueAir HEPA Replacement ...   
3  Hamilton Beach 04913 TrueAir HEPA Repla

                                            category tech1  \
0  [Home & Kitchen, Kitchen & Dining, Dining & En...         
1  [Home & Kitchen, Kitchen & Dining, Dining & En...         
2  [Home & Kitchen, Kitchen & Dining, Storage & O...         
3  [Home & Kitchen, Kitchen & Dining, Bakeware, P...         
4  [Home & Kitchen, Kitchen & Dining, Cookware, A...         

                                         description fit  \
0  [Ideal for displaying meats, fruits or vegetab...       
1  [Ideal for displaying meats, fruits or vegetab...       
2  [The word kraft means strong in German. Kraft ...       
3  [<div class="aplus">, The Handi-Foil 30430 alu...       
4  [Ridged aluminum foil pan provides superior qu...       

                                               title  \
0  Genpak 10SWH Supermarket Trays, Foam, White, 1...   
1  Genpak 17SWH 8-1/4-Inch Length by 4-3/4-Inch W...   
2  Boardwalk K3650612 Kraft Paper, 36 in x 612 ft...   
3  Handi-Foil of America 30430 Aluminum Pi

                                            category  \
0  [Home & Kitchen, Storage & Organization, Cloth...   
1  [Home & Kitchen, Home Dcor, Window Treatments,...   
2  [Home & Kitchen, Storage & Organization, Laund...   
3  [Home & Kitchen, Bedding, Kids' Bedding, Blank...   
4  [Home & Kitchen, Bedding, Comforters & Sets, C...   

                                               tech1  \
0   class="a-keyvalue prodDetTable" role="present...   
1                                                      
2                                                      
3                                                      
4                                                      

                                         description fit  \
0  [The Babies R Us 2-Pack Clip Hangers offer 2 s...       
1  [The Echo Window Valance measures 53.5 inches ...       
2  [The Disney Pixar Monsters University Pop Up H...       
3            [Disney's Little Mermaid Micro Raschel]       
4  [Can you smell what The

                                            category tech1  \
0  [Home & Kitchen, Kitchen & Dining, Storage & O...         
1  [Home & Kitchen, Kitchen & Dining, Storage & O...         
2  [Home & Kitchen, Kitchen & Dining, Kitchen Ute...         
3  [Home & Kitchen, Kitchen & Dining, Storage & O...         
4  [Home & Kitchen, Kitchen & Dining, Bakeware, C...         

                                         description fit  \
0  [The Premium Black Mylar Foil Open Top Pouch i...       
1  [The Premium Black Mylar Foil Open Top Pouch i...       
2                                                 []       
3  [The Premium Silver Mylar Foil Open Top Pouch ...       
4  [Here is a flexible resin mold that can be use...       

                                               title  \
0  100x Premium Black Mylar Foil Open Top Pouch +...   
1  100x Premium Glossy Black Mylar Foil Open Top ...   
2  Professional Wine Opener by HiCoup &ndash; Ros...   
3  100x Premium Silver Mylar Open Top Bags

                                            category tech1  \
0  [Home & Kitchen, Kitchen & Dining, Kitchen Ute...         
1  [Home & Kitchen, Bedding, Bed Pillows & Positi...         
2  [Home & Kitchen, Kitchen & Dining, Storage & O...         
3                  [Home & Kitchen, Bath, Bath Rugs]         
4           [Home & Kitchen, Event & Party Supplies]         

                                         description fit  \
0                                                 []       
1                                                 []       
2  [Savel is a flexible food saver that covers cu...       
3  [Microban antimicrobial product protection inh...       
4  [Palm Tree and Parrot Fanci-frames (1/pkg) Pkg...       

                                               title  \
0  Barvivo Professional Waiters Corkscrew This Wi...   
1  NeckSnug - Luxury Travel Pillow - 100% Memory ...   
2  Dreamfarm DFSA6704 Savel Food Saver, Assorted ...   
3  Microban Antimicrobial Memory Foam, Non

                                            category  \
0  [Home & Kitchen, Home Dcor, Area Rugs, Runners...   
1  [Home & Kitchen, Kitchen & Dining, Kitchen Ute...   
2  [Home & Kitchen, Kitchen & Dining, Dining & En...   
3  [Home & Kitchen, Home Dcor, Home Dcor Accents,...   
4  [Home & Kitchen, Kitchen & Dining, Bakeware, D...   

                                               tech1  \
0   class="a-keyvalue prodDetTable" role="present...   
1                                                      
2                                                      
3                                                      
4                                                      

                                         description fit  \
0  [Forget those boring, plain mats that somehow ...       
1  [The BREKX Hillcrest Copper Finish Pebbled Bev...       
2             [Booker and Dax Cocktail Shaking Cube]       
3  [Our light-weight and delightful hand fans are...       
4  [Celebrate Christmas wi

                                            category tech1  \
0  [Home & Kitchen, Kitchen & Dining, Kitchen & T...         
1  [Home & Kitchen, Kitchen & Dining, Dining & En...         
2  [Home & Kitchen, Kitchen & Dining, Storage & O...         
3  [Home & Kitchen, Kitchen & Dining, Storage & O...         
4  [Home & Kitchen, Bath, Bathroom Accessories, S...         

                                         description fit  \
0                                                 []       
1  [The best 90th birthday gift is a practical gi...       
2  [Is your fridge or freezer a huge mess and you...       
3  [Is your fridge or freezer a huge mess and you...       
4  [Add life to your bathroom decor with this chi...       

                                               title  \
0  Chelsea Home Set of 4 Reversible Cloth Place M...   
1  90th Birthday Gifts For All Took 90 Years Awes...   
2  Scotty's (TM) Refrigerator, Freezer, and Pantr...   
3  Scotty's TM Clear Refrigerator, Freezer

                                            category tech1  \
0  [Books, Politics & Social Sciences, Politics &...         
1                  [Books, Self-Help, Relationships]         
2  [Books, Christian Books &amp; Bibles, Bible St...         
3  [Books, Teen &amp; Young Adult, Literature &am...         
4  [Books, Business &amp; Money, Marketing &amp; ...         

                                         description fit  \
0  [&#8220;This book tells what should have been ...       
1  [, <em>After the Affair</em> teaches partners ...       
2  [It contains insights and commentary by a wide...       
3  [Praise for Pretty Little Liars: Shepard does ...       
4  [a lively, thought-provoking, and often humoro...       

                                               title  \
0  Mossad: The Greatest Missions of the Israeli S...   
1  After the Affair: Healing the Pain and Rebuild...   
2  The Love Wins Companion: A Study Guide for Tho...   
3  Pretty Little Liars: Pretty Little Secr

                                            category tech1  \
0                         [Books, History, Military]         
1            [Books, Literature & Fiction, Literary]         
2  [Books, Reference, Writing, Research & Publish...         
3                     [Books, Biographies & Memoirs]         
4   [Books, New, Used & Rental Textbooks, Reference]         

                                         description fit  \
0                                     [Unusual book]       
1  [Georges Simenon was born at Liege in Belgium ...       
2                                                 []       
3                                                 []       
4                                     [Unusual book]       

                                               title  \
0                     World War One: A Short History   
1            Maigret in Court (Penguin Red Classics)   
2  The Customs of the Kingdoms of India (Penguin ...   
3    Julie and Julia: My Year of Cooking D

                                            category tech1  \
0                          [Books, Children's Books]         
1  [Books, New, Used &amp; Rental Textbooks, Huma...         
2  [Books, Literature &amp; Fiction, History &amp...         
3                                                 []         
4  [Books, New, Used &amp; Rental Textbooks, Huma...         

                                         description fit  \
0                                               [, ]       
1  [While [Lynch] is learned enough about the lit...       
2  [Ralph C. Wood is University Professor of Theo...       
3                                                 []       
4  [[A]s the only English version of any edition ...       

                                               title  \
0                            Heidi (Classic Reprint)   
1  Images of Hope: Imagination as Healer of the H...   
2  The Comedy of Redemption: Christian Faith and ...   
3                            A Husband for

                                            category tech1  \
0  [Books, New, Used &amp; Rental Textbooks, Huma...         
1  [Books, Reference, Writing, Research &amp; Pub...         
2                                                 []         
3  [Books, Literature &amp; Fiction, History &amp...         
4  [Books, Reference, Writing, Research &amp; Pub...         

                                         description fit  \
0                                               [, ]       
1  [, This comprehensive anthology of contemporar...       
2                    [Fourth Grade Student Text, , ]       
3                                               [, ]       
4                                               [, ]       

                                               title  \
0  God Matters: Readings in the Philosophy of Rel...   
1              The Contemporary American Short Story   
2  Addison Wesley Math Makes Sense - 4 (Addison W...   
3  American Literature, Volume I (Penguin 

                                            category tech1  \
0  [Books, New, Used &amp; Rental Textbooks, Medi...         
1  [Books, Business &amp; Money, Management &amp;...         
2   [Books, Science &amp; Math, Biological Sciences]         
3  [Books, New, Used &amp; Rental Textbooks, Medi...         
4  [Books, Business &amp; Money, Management &amp;...         

                                         description fit  \
0  [From the reviews: "Given its broad coverage a...       
1  [, From the reviews:, "This book is a collecti...       
2  [, From the reviews of the second edition:, , ...       
3  [, From the reviews:, "In this introductory te...       
4  [, From the book reviews:, , , <em>Managerial ...       

                                               title  \
0  Subcortical Structures and Cognition: Implicat...   
1  Supply Chain Risk: A Handbook of Assessment, M...   
2                              The Machinery of Life   
3  Epidemiology and Biostatistics: An Intr

                                            category tech1  \
0  [Books, Mystery, Thriller &amp; Suspense, Myst...         
1  [Books, Mystery, Thriller &amp; Suspense, Myst...         
2                       [Books, Romance, Historical]         
3     [Books, Mystery, Thriller & Suspense, Mystery]         
4                       [Books, Romance, Historical]         

                                         description fit  \
0  [The fourth Shirley McClintock mystery has an ...       
1  [party in the Caribbean arranged by Lady Marga...       
2  [Flora, foliage and gardening lore don't make ...       
3  [Although I now live in New York City, there's...       
4  [The first romance in "The Sisters of Mercy Fl...       

                                               title  \
0                           Death and the Delinquent   
1  Perfect Day for Dying (A Lady Margaret Priam M...   
2                                     Time For Roses   
3                         We Wish You a Me

                                            category tech1  \
0  [Books, New, Used &amp; Rental Textbooks, Huma...         
1  [Books, New, Used &amp; Rental Textbooks, Busi...         
2  [Books, New, Used &amp; Rental Textbooks, Scie...         
3  [Books, Reference, Dictionaries &amp; Thesauru...         
4             [Books, Arts &amp; Photography, Music]         

                                         description fit  \
0  [This volume of the second edition of the Camb...       
1              [Book by Blaug, Mark; Mark Blaug, , ]       
2  ["Thoroughly researched, with copious links to...       
3  [' ... can quite safely be said to be the most...       
4          [Text: English, German (translation), , ]       

                                               title  \
0  The Cambridge Ancient History Volume 7, Part 2...   
1                      Economic Theory in Retrospect   
2  The Expanding Universe: Astronomy's 'Great Deb...   
3  Better English Pronunciation (Cambridge

                                    category tech1  \
0  [Books, Literature &amp; Fiction, Poetry]         
1     [Books, Arts &amp; Photography, Music]         
2                                         []         
3  [Books, Literature &amp; Fiction, Poetry]         
4     [Books, Arts &amp; Photography, Music]         

                                         description fit  \
0  [Kirk Diedrich is a writer, artist and self-co...       
1  ["...Some of the exercises here, while smartly...       
2  [Business leaders continually feel <i>Frustrat...       
3                                               [, ]       
4  [In the 1990s, an incredible underground revol...       

                                               title  \
0                                    Junk Shop Heart   
1  Advanced Rhythmic Concepts for Guitar; Forewor...   
2  Stop Being Frustrated &amp; Overcharged By You...   
3                                    Everything Neon   
4  Dancefloor Thunderstorm Land of

                                            category tech1  \
0  [Books, Mystery, Thriller &amp; Suspense, Myst...         
1  [Books, Children's Books, Geography &amp; Cult...         
2  [Books, Parenting & Relationships, Family Rela...         
3  [Books, Business &amp; Money, Marketing &amp; ...         
4          [Books, Business &amp; Money, Industries]         

                                         description fit  \
0  [, Suzanne Escott spent many years managing an...       
1  [Valerie Reynolds is a Chicago-based writer, m...       
2                                                 []       
3  [A serial entrepreneur, <b>Ryan Holmes</b> sta...       
4                                               [, ]       

                                               title  \
0                                The Antique Dealers   
1               The Joys of Being a Little Black Boy   
2     A Life Guide to Living Victoriously Over Abuse   
3                         The 4 Billion Do

                                            category tech1  \
0  [Books, Politics &amp; Social Sciences, Archae...         
1  [Books, Engineering &amp; Transportation, Tran...         
2  [Books, Engineering &amp; Transportation, Tran...         
3  [Books, Biographies &amp; Memoirs, Leaders &am...         
4                           [Books, History, Europe]         

                                         description fit  \
0                                           [, , , ]       
1                                           [, , , ]       
2                                       [, , , , , ]       
3                                           [, , , ]       
4  ["...if you did grow up in the 1950s then you ...       

                                               title  \
0                      Landscape Archaeology and GIS   
1                       The QE2 Story (Story series)   
2                       The QM2 Story (Story series)   
3                                  Our Man

                                            category tech1  \
0   [Books, Computers &amp; Technology, Programming]         
1  [Books, Computers &amp; Technology, Hardware &...         
2  [Books, Computers &amp; Technology, Certificat...         
3  [Books, Business &amp; Money, Management &amp;...         
4  [Books, Business &amp; Money, Management &amp;...         

                                         description fit  \
0  [Mastering VBA, Want to Get More From Office? ...       
1  [The late Seventies to the early Nineties was ...       
2  [<b>Prepare for the CEH certification exam wit...       
3  [usefulthis book is worth reading (<i>The Brit...       
4  [<b>Clear-Cut Ways to Manage Project Risk</b>,...       

                                               title  \
0                                      Mastering VBA   
1  Digital Retro: The Evolution and Design of the...   
2  CEH: Official Certified Ethical Hacker Review ...   
3  Herding Chickens: Innovative Techniques

                                            category tech1  \
0  [Books, Teen &amp; Young Adult, Literature &am...         
1  [Books, Reference, Writing, Research & Publish...         
2  [Books, Teen & Young Adult, Education & Refere...         
3   [Books, Test Preparation, College & High School]         
4  [Books, Teen &amp; Young Adult, Education &amp...         

                                         description fit  \
0  [Eoin Colfer (pronounced Owen) is a former ele...       
1  [Essays That Scored. Essays That Bored. <BR>Wh...       
2  [The experts at The Princeton Review have been...       
3                                                 []       
4  [The experts at The Princeton Review have been...       

                                               title  \
0                WARP Book 1: The Reluctant Assassin   
1  College Essays That Made a Difference, 6th Edi...   
2  Cracking the SAT Literature Subject Test, 15th...   
3  ACT Elite 36: Elite Prep for Advanced S

                                            category tech1  \
0  [Books, Crafts, Hobbies &amp; Home, Home Impro...         
1  [Books, Arts &amp; Photography, Photography &a...         
2  [Books, Cookbooks, Food & Wine, Regional & Int...         
3                         [Books, History, Americas]         
4  [Books, Crafts, Hobbies &amp; Home, Home Impro...         

                                         description fit  \
0  [Whether it's a studio apartment or a rambling...       
1  [hotographer Joel Sternfeld turns his exacting...       
2  [The great chef Patrick O'Connell went to coll...       
3  [Set to air February 10, the HBO documentary c...       
4                                               [, ]       

                                               title  \
0  Susan Sargent's The Comfort of Color: inspire ...   
1                                   Stranger Passing   
2  Patrick O'Connell's Refined American Cuisine: ...   
3  Unchained Memories: Readings from the S

                                            category tech1  \
0  [Books, Cookbooks, Food &amp; Wine, Cooking by...         
1                  [Books, Christian Books & Bibles]         
2   [Books, Children's Books, Education & Reference]         
3                                 [Books, Reference]         
4                            [Books, Travel, Africa]         

                                         description fit  \
0                                               [, ]       
1  [Lorraine Parkinson has been a parish minister...       
2                                                 []       
3  [1991 Becoming Literate: The Construction of I...       
4  [Henno Martin, born in 1910 in Freiburg, Germa...       

                                               title  \
0  Vegetables: Recipes and Techniques from the Wo...   
1  The World According to Jesus ... his blueprint...   
2  Cursive, Grades 2 - 4 (Handwriting Skill Build...   
3  Becoming Literate: The Construction of 

                                            category tech1  \
0  [Books, Crafts, Hobbies &amp; Home, Crafts &am...         
1                                                 []         
2       [Books, Arts & Photography, Performing Arts]         
3        [Books, Biographies &amp; Memoirs, Memoirs]         
4  [Books, Crafts, Hobbies & Home, Crafts & Hobbies]         

                                         description fit  \
0  [Excellent condition, clean, tight paperback p...       
1  [Drama, Plays, Theatre, Literature, Reading, L...       
2  [Richard Pilbrow first made his mark at Olivie...       
3  [<span>Through genuinelyheroic compassion, as ...       
4  [Sarah Thursfield has been supplying clothing ...       

                                               title  \
0  The Little Corset Book: A Workbook on Period U...   
1                              The Robber Bridegroom   
2  Stage Lighting Design: The Art, the Craft, the...   
3  The Fifth Season: A Daughter-in-Law's M

                                            category tech1  \
0                 [Books, Arts & Photography, Music]         
1                         [Books, History, Americas]         
2                         [Books, History, Military]         
3                                                 []         
4  [Books, Christian Books & Bibles, Christian Li...         

                                         description fit  \
0                                                 []       
1                                               [, ]       
2  [This publication documents all 86 Naval Air S...       
3  [Publisher: Farnsworth House Military Impressi...       
4  ["ONE THING YOU CAN'T DO IN HEAVEN BY MARK CAH...       

                                               title  \
0  What to Do on Thursday: A Layman's Guide to th...   
1        Postcards from Paradise: Romancing Key West   
2   United States Naval Air Stations of World War II   
3  &quot;Come on, you wolverines!&quot;: C

                                            category tech1  \
0                                                 []         
1  [Books, Children's Books, Mysteries &amp; Dete...         
2                       [Books, Romance, Historical]         
3  [Books, Children's Books, Mysteries &amp; Dete...         
4  [Books, Religion &amp; Spirituality, New Age &...         

                                         description fit  \
0  ["200,000 Years of Germanic World Culture and ...       
1  [With a background in paediatric nursing, Juli...       
2  [<span><b>***5 stars***</b>"Although this is c...       
3  [With a background in paediatric nursing, Juli...       
4  [<b>Sarah Prout</b> and <b>Sean Patrick Simpso...       

                                               title  \
0                         Atlantis, Edda &amp; Bible   
1  Frankie Dupont And The Lemon Festival Fiasco (...   
2  The Medium: An Emily Chambers Spirit Medium No...   
3  Frankie Dupont And The Science Fair Sab

                                            category tech1  \
0  [Books, Literature &amp; Fiction, History &amp...         
1  [Books, Engineering &amp; Transportation, Engi...         
2                                                 []         
3        [Books, Literature &amp; Fiction, Literary]         
4        [Books, Literature &amp; Fiction, Literary]         

                                         description fit  \
0                                               [, ]       
1  [Printed in Asia - Carries Same Contents as of...       
2  [This book is in Excellent condition. Only tak...       
3                                                 []       
4                                                 []       

                                               title  \
0                                      One-Upmanship   
1      Fluid Mechanics With Engineering Applications   
2          Project Management The Managerial Process   
3   Mechanical Springs: Their Engineering 

                                            category tech1  \
0  [Books, Teen &amp; Young Adult, Literature &am...         
1  [Books, Teen &amp; Young Adult, Literature &am...         
2        [Books, Comics &amp; Graphic Novels, Manga]         
3  [Books, Teen &amp; Young Adult, Literature &am...         
4  [Books, Teen &amp; Young Adult, Literature &am...         

                                         description fit  \
0  [Naoshi Komi was born in Kochi Prefecture, Jap...       
1                                               [, ]       
2                                               [, ]       
3  [Naoshi Komi was born in Kochi Prefecture, Jap...       
4  [Go Ikeyamada is a Gemini from Miyagi Prefectu...       

                                       title  \
0               Nisekoi: False Love, Vol. 12   
1  The Demon Prince of Momochi House, Vol. 2   
2                       Love Stage!!, Vol. 4   
3               Nisekoi: False Love, Vol. 10   
4                 So Cute 

                                            category tech1 description fit  \
0  [Books, Crafts, Hobbies &amp; Home, Home Impro...          [, , , ]       
1  [Books, Humor &amp; Entertainment, Puzzles &am...          [, , , ]       
2  [Books, Children's Books, Education &amp; Refe...              [, ]       
3  [Books, Cookbooks, Food &amp; Wine, Main Cours...          [, , , ]       
4  [Books, Humor &amp; Entertainment, Puzzles &am...          [, , , ]       

                                               title  \
0  Style &amp; Simplicity: An A to Z Guide to Liv...   
1  Infernally Hard Fireball Crosswords: 45 Ultra ...   
2  First Words/Primeras palabras (Say &amp; Play)...   
3  Salads: Fresh, Delicious Dishes for All Occasions   
4                              Double Trouble Sudoku   

                                            also_buy image tech2  \
0  [0310337909, 0804186278, 1452105944, 147674487...    []         
1  [1402790775, 1454910089, 1402790783, 145491645...    []

                                            category tech1  \
0  [Books, Reference, Foreign Language Study &amp...         
1               [Books, Religion &amp; Spirituality]         
2     [Books, Mystery, Thriller & Suspense, Mystery]         
3        [Books, Literature & Fiction, Contemporary]         
4  [Books, Mystery, Thriller &amp; Suspense, Myst...         

                                         description fit  \
0                                               [, ]       
1  [, Don Rude is a Christian layman, who lives i...       
2                                                 []       
3  [<b>"This novel is an arrow through the heart....       
4                                               [, ]       

                                               title  \
0  Spanish for the Physical Therapist: Bridging t...   
1  Simple Man Simple Prayer: Experience Renewal, ...   
2     Just Add Salt (Hetta Coffey Series) (Volume 2)   
3                                 The Memo

                                            category tech1  \
0  [Books, Self-Help, Communication & Social Skills]         
1  [Books, Health, Fitness &amp; Dieting, Alterna...         
2                 [Books, Arts & Photography, Music]         
3                         [Books, History, Americas]         
4                     [Books, Romance, Contemporary]         

                                         description fit  \
0                                                 []       
1  [Alexa Moore's book "Essential Oil" is<b>one o...       
2                                                 []       
3                                               [, ]       
4                                                 []       

                                               title  \
0  The People Skills Guide: Small Talk, Business ...   
1  Essential Oils: Ultimate Essential Oils Guide ...   
2                     The Cotton Picker - An Odyssey   
3     Finding Owl Canyon: Book One - 1875 

                                            category tech1  \
0  [Books, Children's Books, Computers &amp; Tech...         
1                         [Books, History, Americas]         
2  [Books, Christian Books &amp; Bibles, Literatu...         
3  [Books, Biographies & Memoirs, Arts & Literature]         
4          [Books, Literature &amp; Fiction, Poetry]         

                                         description fit  \
0                                               [, ]       
1  [Steven Hager was the first reporter to cover ...       
2  [, Taylor Michaels writes romantic suspense. A...       
3                                                 []       
4                                               [, ]       

                                               title  \
0  Unofficial Coloring Book With Jokes For Minecr...   
1                    Killing Kennedy: The Real Story   
2   Exit Wounds (Sonoran Security Agency) (Volume 3)   
3  Raised by Wolves: Growing up Poor in 19

                                            category tech1  \
0  [Books, Politics &amp; Social Sciences, Social...         
1  [Books, Arts &amp; Photography, Photography &a...         
2  [Books, Politics &amp; Social Sciences, Politi...         
3                         [Books, Law, Law Practice]         
4  [Books, New, Used & Rental Textbooks, Humanities]         

                                         description fit  \
0  [<i>Made in America</i> by Laurie Olsen, codir...       
1  [Colorado Skies (Colorado Littlebooks) \n\n(Vi...       
2  [Most accessible but not limited to graduate s...       
3                                       [, , , , , ]       
4  [If the 1962 Cuban Missile Crisis was the most...       

                                               title  \
0  Made in America: Immigrant Students in Our Pub...   
1  Colorado Skies: With Selected Prose &amp; Poet...   
2  Teaching for Social Justice: A Democracy and E...   
3  Critical Race Theory: The Key Writings 

                                            category tech1  \
0             [Books, Sports & Outdoors, Basketball]         
1  [Books, Christian Books &amp; Bibles, Bible St...         
2  [Books, Health, Fitness &amp; Dieting, Exercis...         
3  [Books, Sports &amp; Outdoors, Football (Ameri...         
4  [Books, Sports &amp; Outdoors, Other Team Sports]         

                                         description fit  \
0  [Cliff Ellis is the former head men s basketba...       
1                                               [, ]       
2                                    [Rare book, , ]       
3  [A very impressive collection and presentation...       
4  [Cecile Reynaud was the head women s volleybal...       

                                               title  \
0  Zone Press Variations for Winning Basketball (...   
1                                    Good News Bible   
2  Ace's Guide to Exercise Testing and Program De...   
3  Footballs Quick Passing Game (Art &amp;

                                            category tech1  \
0  [Books, Business &amp; Money, Management &amp;...         
1                     [Books, Romance, Contemporary]         
2             [Books, Literature & Fiction, Erotica]         
3         [Books, Literature &amp; Fiction, Erotica]         
4  [Books, Business &amp; Money, Management &amp;...         

                                         description fit  \
0                                               [, ]       
1  [<DIV>Shelley Bradley lives in Flower Mound, T...       
2  [A Little Harmless Sex by Melissa Schroeder is...       
3                                               [, ]       
4  [Margaret Seidler is an organization developme...       

                                               title  \
0  Collaborative Leadership in Action: A Field Gu...   
1                              Naughty Little Secret   
2                              A Little Harmless Sex   
3            The Ice Dragon (Dragon Knight

                                            category tech1  \
0  [Books, Christian Books & Bibles, Christian Li...         
1  [Books, Christian Books & Bibles, Christian Li...         
2  [Books, Christian Books & Bibles, Christian Li...         
3  [Books, Engineering & Transportation, Transpor...         
4  [Books, Engineering &amp; Transportation, Tran...         

                                         description fit  \
0  [My long-time friends, Stuart and Jill Briscoe...       
1  [David Apple's life is a story of mercy receiv...       
2  [Jill Briscoe is a highly-sought international...       
3                                                 []       
4                                           [, , , ]       

                                               title  \
0  Improving with Age: God's Plan for Getting Old...   
1  Not Just a Soup Kitchen: How Mercy Ministry in...   
2                                       Heartstrings   
3  The Flight Instructor's Survival Guide:

                                            category tech1  \
0  [Books, Crafts, Hobbies &amp; Home, Crafts &am...         
1                                                 []         
2  [Books, Children's Books, Education &amp; Refe...         
3  [Books, Religion &amp; Spirituality, New Age &...         
4                                                 []         

                                         description fit  \
0  [Barrington Barber is a renowned authority on ...       
1                                                 []       
2                                           [, , , ]       
3                                           [, , , ]       
4  [The Nazis kept extensive files on practically...       

                                               title  \
0                                   Anyone Can Paint   
1                              Convertible Submarine   
2    Adding and Subtracting Puzzle and Activity Book   
3         1001 Ways to Creativity (1001 Wa

                                            category tech1  \
0  [Books, Business &amp; Money, Management &amp;...         
1  [Books, Literature &amp; Fiction, Short Storie...         
2               [Books, Science &amp; Math, Physics]         
3                         [Books, History, Americas]         
4                                                 []         

                                         description fit  \
0  [I have thoroughly enjoyed your QI Macros soft...       
1                        [Book by Greene, J. R., , ]       
2  [Katya Walter has a Ph.D. with an interdiscipl...       
3  [Benjamin Franklin Awards - Silver Award for B...       
4  [Norman Gibat is an Electronics Engineer. In 1...       

                                               title  \
0  Six Sigma Simplified, 3rd ed - Breakthrough Im...   
1                     Strange Tales from Old Quabbin   
2  Double Bubble Universe: The Paradigm (God's TO...   
3  Superstition Wilderness Trails West: Hi

                                            category tech1  \
0   [Books, Literature &amp; Fiction, Genre Fiction]         
1  [Books, Comics &amp; Graphic Novels, Graphic N...         
2  [Books, Comics &amp; Graphic Novels, Graphic N...         
3                                                 []         
4   [Books, Comics & Graphic Novels, Graphic Novels]         

                                         description fit  \
0                                         [, , , , ]       
1  [When you've outgrown the shy schoolgirl roman...       
2  [Grade 10 UpNelson and various teams inject a ...       
3  [Sci-Fi Channels smash hit show returns in thi...       
4  [Grade 9 Up Created by H. P. Lovecraft in 1926...       

                                               title  \
0  What to Do When You Meet Cthulhu: A Guide to S...   
1                                     Voices Of Love   
2              Fall of Cthulhu Vol. 2: The Gathering   
3                         Eureka Vol 2: Do

                                            category tech1  \
0  [Books, Biographies & Memoirs, Arts & Literature]         
1  [Books, Business & Money, Small Business & Ent...         
2  [Books, Religion & Spirituality, New Age & Spi...         
3       [Books, Literature & Fiction, Genre Fiction]         
4         [Books, Science Fiction & Fantasy, Gaming]         

                                         description fit  \
0  [Barbara Salani Born in Caracas, Venezuela, fr...       
1  [Kim Gateb was born in New England and grew up...       
2  [Nifty Notebooks design beautiful <b>notebooks...       
3                                                 []       
4                                                 []       

                                               title  \
0                Music for Life: The Salani Brothers   
1                         The Entrepreneur's Journal   
2  Epic Ideas: Ideas Notebook Journal 120-Page Li...   
3                                         

                                            category tech1  \
0                                                 []         
1               [Books, Science & Math, Mathematics]         
2  [Books, Reference, Foreign Language Study &amp...         
3                                                 []         
4                                                 []         

                                         description fit  \
0  [This book illustrates clearly and cleverly ho...       
1  [Griddlers team is a leader of an online commu...       
2                                               [, ]       
3                                               [, ]       
4  [There are many well-known travel guides avail...       

                                               title  \
0         From Buffalo Burgers to Monetary Mysteries   
1  Griddlers Logic Puzzles: Black and White (Volu...   
2  To Succeed in Hebrew - A - Beginner's Level wi...   
3  The Garden of Healing:A Practical Guide

                                            category tech1  \
0                                                 []         
1                                                 []         
2  [Books, Crafts, Hobbies & Home, Crafts & Hobbies]         
3                                                 []         
4                                                 []         

                                         description fit  \
0                   [Jonathan Kozol Charles Keating]       
1  [The relationship of Regional Geology to the T...       
2  [, <i>Pulled Thread Embroidery Stitches</i> co...       
3  [Will be shipped from US. Used books may not i...       
4                                                 []       

                                               title  \
0  Playboy Magazine April 1992 (1-907, girls of t...   
1  Advanced Prospecting &amp; Detecting for Hardr...   
2                  Pulled Thread Embroidery Stitches   
3  Deceptively Delicious: Simple Secrets t

                                           category tech1 description fit  \
0  [Books, Comics & Graphic Novels, Graphic Novels]                []       
1  [Books, Comics & Graphic Novels, Graphic Novels]                []       
2  [Books, Comics & Graphic Novels, Graphic Novels]                []       
3  [Books, Comics & Graphic Novels, Graphic Novels]                []       
4  [Books, Comics & Graphic Novels, Graphic Novels]                []       

                                               title  \
0   Star Trek/Legion of Super-Heroes #5 (of 6) eBook   
1                                          Star Trek   
2   Star Trek/Legion of Super-Heroes #1 (of 6) eBook   
3                                          Star Trek   
4                                          Star Trek   

                                            also_buy image tech2  \
0  [B00N13TJUK, B00N13TKWC, B00N13TJ50, B00N13TJL...    []         
1   [B00N13TNX8, B00N13TO1Y, B00N13TOUK, B00N13TPNG]    []      

                                            category tech1 description fit  \
0   [CDs & Vinyl, Rap & Hip-Hop, Gangsta & Hardcore]                []       
1  [CDs & Vinyl, World Music, Europe, Continental...                []       
2       [CDs & Vinyl, Christian, Pop & Contemporary]                []       
3  [CDs & Vinyl, Alternative Rock, Hardcore & Pun...                []       
4                               [CDs & Vinyl, Blues]                []       

                   title                                          also_buy  \
0     Laugh &amp; a Half                          [B000002NXL, B00005N8SQ]   
1      Petra En Alabanza                                      [B079J855W1]   
2  Celebrate &amp; Party  [B00000313D, B00001YVD3, B00000312U, B000005OJX]   
3        Meat Your Maker                                      [B00000I9EC]   
4              Slow Burn  [B000SBA0NI, B00000DTX9, B000007SI5, B002S39CPG]   

                                               image tech2    

                                            category tech1  \
0       [CDs & Vinyl, Christian, Pop & Contemporary]         
1           [CDs & Vinyl, Dance & Electronic, House]         
2                         [CDs & Vinyl, Jazz, Bebop]         
3  [CDs & Vinyl, Alternative Rock, Goth & Industr...         
4            [CDs & Vinyl, Metal, Alternative Metal]         

                                         description fit  \
0  [1. Change - Sierra, Beck, Joe [Jazz]  \n2. Th...       
1  [Sonique ~ Hear My Cry, A pair of uptempo, min...       
2  [Tabla, sitar, dulcimer and other Eastern inst...       
3                                                 []       
4                                                 []       

                        title  \
0                      Change   
1                 Hear My Cry   
2  Best Of The Vanguard Years   
3                  Black Aria   
4                   Sacrifice   

                                            also_buy  \
0   [B00005

                                            category tech1  \
0              [CDs & Vinyl, Jazz, New Orleans Jazz]         
1  [CDs & Vinyl, Alternative Rock, New Wave & Pos...         
2                               [CDs & Vinyl, Metal]         
3            [CDs & Vinyl, Pop, Oldies, Girl Groups]         
4  [CDs & Vinyl, World Music, South & Central Ame...         

                                         description fit  \
0                                                 []       
1  [Import re-issue of Nick Cave's pre-Birthday P...       
2                                                 []       
3                                                 []       
4   [European Version; Features Three Bonus Tracks.]       

                                               title  \
0                                        Weary Blues   
1                                          Door Door   
2                                    Freak of Nature   
3  Under The Influence - The Original Vers

                                            category tech1  \
0  [CDs & Vinyl, Alternative Rock, New Wave & Pos...         
1          [CDs & Vinyl, Dance & Electronic, Techno]         
2  [CDs & Vinyl, Alternative Rock, British Altern...         
3  [CDs & Vinyl, Folk, British & Celtic Folk, Iri...         
4              [CDs & Vinyl, Pop, Adult Alternative]         

                                         description fit  \
0                 [DVD is NTSC region code 0 format]       
1  [TRACKLISTING: 01.MOUNTAIN 02.TAO NR. 43 03.DI...       
2  [The Manic Street Preachers return with LifeBl...       
3  [Irish band, The Pogues, bring their infectiou...       
4  [Featuring the 2 extra tracks: 'Disoriented', ...       

                                 title  \
0          Culture Club: Greatest Hits   
1                          Colour Haze   
2                            Lifeblood   
3  Live at the Town &amp; Country Club   
4                    Mistaken Identity   

             

                                            category tech1  \
0               [CDs & Vinyl, Classical, Symphonies]         
1                                [CDs & Vinyl, Jazz]         
2                                [CDs & Vinyl, Jazz]         
3                         [CDs & Vinyl, World Music]         
4  [CDs & Vinyl, World Music, Europe, Continental...         

                                         description fit  \
0  [I will ship by EMS or SAL items in stock in J...       
1  [Amazing 100 CD Set of containing a plethora o...       
2  [Awesome 100 CD set containing a plethora of c...       
3  [Spanning the boundaries of Folk and Jazz, Sco...       
4                                                 []       

                                               title  \
0  The Masters of Music - More than 250 works of ...   
1  King Oliver, Frank Teschemacher, Duke Ellingto...   
2  Worlds Greatest Jazz Collection: Big Bands - T...   
3                                        R

                                            category tech1  \
0                           [CDs & Vinyl, R&B, Soul]         
1                                 [CDs & Vinyl, Pop]         
2            [CDs & Vinyl, Children's Music, Disney]         
3  [CDs & Vinyl, Classical, Forms & Genres, Conce...         
4                                 [CDs & Vinyl, Pop]         

                                         description fit  \
0  [This 24k audiophile gold disc reissue of Sly ...       
1  [Live at Third Man Records 10-8-2012 The Shins...       
2  [Bring home The Little Mermaid Greatest Hits, ...       
3  [Antonio Pompa-Baldi has recorded over 15 albu...       
4  [2013 four CD set filled with classic cuts fro...       

                                               title  \
0               Theres a Riot Going on: Gold Edition   
1                Live at Third Man Records 10-8-2012   
2                  The Little Mermaid: Greatest Hits   
3  Grieg: Piano Concerto in A minor, Op. 1

                                            category tech1  \
0  [Electronics, Camera &amp; Photo, Film Photogr...         
1  [Electronics, Camera &amp; Photo, Film Photogr...         
2  [Electronics, Camera & Photo, Film Photography...         
3  [Electronics, Camera & Photo, Film Photography...         
4  [Electronics, Camera & Photo, Film Photography...         

                                         description fit  \
0  [With razor-sharp 38-135mm 3.6x power zoom len...       
1  [Sure Shot Canon pre owned. In working conditi...       
2  [The Canon Sure Shot 105 Zoom is an automatic ...       
3  [The Pentax IQZoom EZY-R is a simple point-and...       
4  [Pentax IQZoom 140M QD 35mm Point &amp; Shoot ...       

                                     title  \
0    Canon Sure Shot Z135 Zoom 35mm Camera   
1      Canon Sure Shot Tele 80 35mm Camera   
2     Canon Sure Shot 105 Zoom 35mm Camera   
3    Pentax IQ Zoom EZY-R 35mm Zoom Camera   
4  Pentax IQ Zoom 140M QD Date 35mm 

                                            category  \
0  [Electronics, Accessories & Supplies, Audio & ...   
1  [Electronics, Computers & Accessories, Data St...   
2  [Electronics, Computers & Accessories, Laptop ...   
3              [Electronics, Portable Audio & Video]   
4       [Electronics, Headphones, Earbud Headphones]   

                                               tech1  \
0                                                      
1   class="a-keyvalue prodDetTable" role="present...   
2                                                      
3   class="a-keyvalue prodDetTable" role="present...   
4                                                      

                                         description fit  \
0  [The SES-A-V-SYNC, also sometimes referred to ...       
1  [Buffalo's Drive Station DDR is an easy to use...       
2                                                 []       
3                                                 []       
4  [Precision-cut metal ho

                                            category  \
0  [Electronics, Computers & Accessories, Compute...   
1  [Electronics, Computers & Accessories, Laptop ...   
2  [Electronics, Computers & Accessories, Compute...   
3  [Electronics, Computers & Accessories, Laptop ...   
4  [Electronics, Camera & Photo, Lighting & Studi...   

                                               tech1  \
0                                                      
1                                                      
2   class="a-keyvalue prodDetTable" role="present...   
3   class="a-keyvalue prodDetTable" role="present...   
4   class="a-keyvalue prodDetTable" role="present...   

                                         description fit  \
0  [Want to read and write DVDs and CDs in less t...       
1  [Compatible Models \n<br /> Important compatib...       
2  [ASUS is glad to introduce the new X99 Series ...       
3  [<b>This Sophisticated and Chic Premium Diamon...       
4  [Description \n<br>The 

                                            category tech1  \
0  [Electronics, Accessories & Supplies, Audio & ...         
1  [Electronics, Accessories & Supplies, Audio & ...         
2                          [Electronics, Home Audio]         
3  [Electronics, Computers & Accessories, Compute...         
4  [Electronics, Computers & Accessories, Data St...         

                                         description fit  \
0  [Pilot's patented and exclusive Electrolumines...       
1  [Perfect for replacing your misplaced, damaged...       
2  [The Flexson floor stand for the new SONOS PLA...       
3  [Capture and store all your memories with the ...       
4  [From our Antique Collection, we are introduci...       

                                               title  \
0  Pilot Electronics EL-1301BWK Auxiliary Music S...   
1  SF Cable 6ft Ultra Low Profile Angle NEMA 5-15...   
2  Flexson Floor Stand for New Second Generation ...   
3  4 Pack SanDisk 8 GB Class 4 SD HC Flash

                                            category tech1 description fit  \
0  [Kindle Store, Kindle eBooks, Literature & Fic...                []       
1  [Kindle Store, Kindle eBooks, Science Fiction ...                []       
2  [Kindle Store, Kindle eBooks, Literature & Fic...                []       
3   [Kindle Store, Kindle eBooks, Sports & Outdoors]                []       
4  [Kindle Store, Kindle eBooks, Science Fiction ...                []       

                                               title  \
0                       Nakedella 2 - Kindle edition   
1   The Dragon&#39;s Flame (The Chronicles of Ter...   
2            The Road to Santiago (Directions) eBook   
3   Survival Manual US Army 2002 and U.S. Army Ra...   
4   Emerald D.A.R.E. (D.A.R.E. Project Book 3) eBook   

                                            also_buy image tech2  \
0  [B07L8F4VC5, B07MKBJ68L, B07FS7JTDW, B07K5XQT6...    []         
1  [B010EB2TA8, B0047O2BXO, B01LAAZ2BU, B07FC39RN...    []

                                            category tech1 description fit  \
0              [Kindle Store, Kindle eBooks, Travel]                []       
1  [Kindle Store, Kindle eBooks, Science Fiction ...                []       
2  [Kindle Store, Kindle eBooks, Literature & Fic...                []       
3  [Kindle Store, Kindle eBooks, Literature & Fic...                []       
4  [Kindle Store, Kindle eBooks, Literature & Fic...                []       

                                               title  \
0                                    Alaska Traveler   
1                            Tales from the Archives   
2           A Different Witch (A Modern Witch Series   
3  Home (gay, billionaire, werewolf, secret lover...   
4  The Holland Family Saga Part Five: Ghost Town ...   

                                            also_buy image tech2  \
0  [B06WGQ3HVK, B004HIM7CK, B004HIM7BG, B004Y1QBU...    []         
1  [B00CDUYW2W, B00KRTG00S, B008CG6KYO, B005Q3767...    []

                                            category tech1 description fit  \
0  [Kindle Store, Kindle eBooks, Literature & Fic...                []       
1  [Kindle Store, Kindle eBooks, Literature & Fic...                []       
2  [Kindle Store, Kindle eBooks, Parenting & Rela...                []       
3  [Kindle Store, Kindle eBooks, Mystery, Thrille...                []       
4  [Kindle Store, Kindle eBooks, Religion & Spiri...                []       

                                               title  \
0  The Scandalous Love of a Duke (Marlow Intrigue...   
1  Plague of Mybyncia (Arizal Wars Book 2) - Kind...   
2                                  Escaping the Cult   
3  Drowning the Daffodils (Heavenly Highland Inn ...   
4  Spirit Guides: Contact Your Spirit Guides &amp...   

                                            also_buy image tech2  \
0  [B00FVE4RXG, B00F240EKU, B00OXHFR6S, B00SS45A3...    []         
1                           [B00IQJK9WQ, B07CTZTBSW]    []

                                            category tech1 description fit  \
0             [Kindle Store, Kindle eBooks, Romance]                []       
1  [Kindle Store, Kindle eBooks, Science Fiction ...                []       
2             [Kindle Store, Kindle eBooks, Romance]                []       
3  [Kindle Store, Kindle eBooks, Mystery, Thrille...                []       
4    [Kindle Store, Kindle eBooks, Business & Money]                []       

                                               title  \
0            Pride Series Books 4-6 - Kindle edition   
1                                 Death in Neverland   
2       The Secret Series Books 4-6 - Kindle edition   
3  Imagineered Death (The DW Mysteries Book 3) - ...   
4                                            Destiny   

                                            also_buy image tech2  \
0  [B01LZABST9, B00DDVLR7I, B00B1TLLIY, B07CCH63C...    []         
1   [B01BUN41NW, B01M8QJITR, B07BBXD8KJ, B01FJ2E96O]    []

                                            category tech1 description fit  \
0  [Kindle Store, Kindle eBooks, Mystery, Thrille...                []       
1      [Kindle Store, Kindle eBooks, Science & Math]                []       
2  [Kindle Store, Kindle eBooks, Health, Fitness ...                []       
3  [Kindle Store, Kindle eBooks, Religion & Spiri...                []       
4  [Kindle Store, Kindle eBooks, Literature & Fic...                []       

                                               title  \
0  Murder, Trouble &amp; Family: An Annie Ryan Co...   
1  ebook,Kevin J. Cheek,Learning the Metric Syste...   
2  Sciatica: The Ultimate Guide To Sciatica Pain ...   
3       The Light Through the Water - Kindle edition   
4  How to Train Her Curves (Training Her Curves E...   

                                            also_buy image tech2  \
0                                       [B06XRRRHVY]    []         
1  [B0763JXJCG, B00HUGJPSK, B000SEHP06, B06XQMNKQ...    []

                                            category tech1 description fit  \
0   [Kindle Store, Kindle eBooks, Children's eBooks]                []       
1  [Kindle Store, Kindle eBooks, Literature & Fic...                []       
2             [Kindle Store, Kindle eBooks, History]                []       
3  [Kindle Store, Kindle eBooks, Literature & Fic...                []       
4  [Kindle Store, Kindle eBooks, Teen & Young Adult]                []       

                                               title  \
0  Rich Dad&#39;s Escape from the Rat Race: How T...   
1                Caught Me Dreaming - Kindle edition   
2  Bound to Lead: The Changing Nature of American...   
3     I Won&#39;t Stop Loving You 2 - Kindle edition   
4   Packet Trade (Devi Jones&#39; Locker Book 1) ...   

                                            also_buy image tech2  \
0  [B017QL9AIS, B0175P5O9E, B015X2PG3K, B01DRWRZ6...    []         
1  [B07L2GJL6L, B07DFQXPX3, B07HS2C1C2, B07FNFFM7...    []

                                            category tech1  \
0  [Sports & Outdoors, Sports & Fitness, Boating ...         
1  [Sports & Outdoors, Fan Shop, Auto Accessories...         
2  [Sports & Outdoors, Outdoor Recreation, Campin...         
3  [Sports & Outdoors, Outdoor Recreation, Outdoo...         
4  [Sports & Outdoors, Outdoor Recreation, Climbi...         

                                         description fit  \
0  [Coghlan's All Weather Wallet is ideal for hun...       
1   [NCAA University Of Arkansas Car Mats (2-Piece)]       
2  [Ideal for backcountry camping, wilderness bac...       
3  [These bolle fang sunglasses are the ideal cho...       
4  [The ultimate hybrid Axe for technical couloir...       

                                               title  \
0                       Coghlan's All Weather Wallet   
1                        Arkansas Car Mats (2-Piece)   
2       Coghlan's Drinking Water Treatment, Two Step   
3  Bolle Sport Fang Sunglasses (Dark Torto

                                            category tech1  \
0  [Sports & Outdoors, Sports & Fitness, Hunting ...         
1  [Sports & Outdoors, Sports & Fitness, Hunting ...         
2  [Sports & Outdoors, Sports & Fitness, Hunting ...         
3  [Sports & Outdoors, Sports & Fitness, Airsoft ...         
4  [Sports & Outdoors, Sports & Fitness, Airsoft ...         

                                         description fit  \
0  [Cleaning your firearms just got a whole lot e...       
1  [, When you are running, walking your dog, or ...       
2                                                 []       
3  [Leupold Rifleman See-Thru Mount Gloss Rings ....       
4  [The AD-RECON mount is made for putting high p...       

                                               title  \
0  Birchwood Casey BC33344 Gun Scrubber Synthetic...   
1  SABRE Red Runner Pepper Gel - Police Strength ...   
2  Magpul USGI 223 Ranger Plate Floorplate Loop (...   
3  Leupold Rifleman See-thru Ring Mounts .

                                            category tech1  \
0  [Sports & Outdoors, Fan Shop, Sports Souvenirs...         
1  [Sports & Outdoors, Fan Shop, Patio, Lawn & Ga...         
2  [Sports & Outdoors, Fan Shop, Patio, Lawn & Ga...         
3  [Sports & Outdoors, Fan Shop, Patio, Lawn & Ga...         
4  [Sports & Outdoors, Fan Shop, Sports Souvenirs...         

                                         description fit  \
0  [Country: England #75646 Wish them happy birth...       
1  [Our Texas Tech Red Raiders Flag measures 3x5 ...       
2  [Our Miami Hurricanes Flag measures 3x5 feet i...       
3  [Our Michigan State University Flag measures 3...       
4                                [Barcelona lanyard]       

                                               title  \
0                 Chelsea F.C. MUSICAL Birthday Card   
1  TTU Texas Tech Red Raiders University Large Co...   
2  Miami Hurricanes UM Canes University Large Col...   
3  MSU White Michigan State Spartans Unive

                                            category tech1  \
0  [Sports & Outdoors, Sports & Fitness, Exercise...         
1  [Sports & Outdoors, Sports & Fitness, Exercise...         
2  [Sports & Outdoors, Sports & Fitness, Leisure ...         
3  [Sports & Outdoors, Sports & Fitness, Leisure ...         
4  [Sports & Outdoors, Sports & Fitness, Leisure ...         

                                         description  \
0  [These Running Shorts are a lightweight traini...   
1  [These Running Shorts are a lightweight traini...   
2                 [Jump Caddy (Large) Length: 7 in.]   
3  [Ultimate Pool Challenge Billiards Card Game T...   
4  [After months of trial and error and extensive...   

                                                 fit  \
0   class="a-normal a-align-center a-spacing-smal...   
1   class="a-normal a-align-center a-spacing-smal...   
2                                                      
3                                                      
4         

                                            category tech1  \
0  [Sports & Outdoors, Outdoor Recreation, Cyclin...         
1  [Sports & Outdoors, Outdoor Recreation, Cyclin...         
2  [Sports & Outdoors, Outdoor Recreation, Cyclin...         
3  [Sports & Outdoors, Outdoor Recreation, Cyclin...         
4  [Sports & Outdoors, Outdoor Recreation, Cyclin...         

                                         description fit  \
0  [With the new Race Face Cinch PF30 bottom brac...       
1  [Custom 19 ball flanged retainer bearings<br><...       
2  [Attaches as part of the RF Cinch system (usin...       
3  [* Durable aluminum housing won't kink or rust...       
4  [Maybe you descend like a maniac and never use...       

                                          title  \
0            RaceFace Cinch PF30 Bottom Bracket   
1  Race Face Bottom Bracket BB92/89.5/104.5/107   
2                    RaceFace Spider Bike Cinch   
3      Jagwire Road Elite Link Brake Kit Silver   
4     Jagwi

                                            category tech1  \
0  [Sports & Outdoors, Sports & Fitness, Other Sp...         
1  [Sports & Outdoors, Sports & Fitness, Other Sp...         
2  [Sports & Outdoors, Sports & Fitness, Accessor...         
3  [Sports & Outdoors, Sports & Fitness, Other Sp...         
4  [Sports & Outdoors, Sports & Fitness, Other Sp...         

                                         description  \
0  [These Kung Fu shoes are perfect for Kung Fu t...   
1  [These Kung Fu shoes are perfect for Kung Fu t...   
2  [Official Gatorade squeeze bottle. Ideal for t...   
3  [These Kung Fu shoes are perfect for Kung Fu t...   
4  [These Kung Fu shoes are perfect for Kung Fu t...   

                                                 fit  \
0   class="a-normal a-align-center a-spacing-smal...   
1   class="a-normal a-align-center a-spacing-smal...   
2                                                      
3   class="a-normal a-align-center a-spacing-smal...   
4   class=

                                            category tech1  \
0  [Sports & Outdoors, Outdoor Recreation, Campin...         
1  [Sports & Outdoors, Outdoor Recreation, Campin...         
2  [Sports & Outdoors, Outdoor Recreation, Campin...         
3  [Sports & Outdoors, Outdoor Recreation, Outdoo...         
4  [Sports & Outdoors, Outdoor Recreation, Campin...         

                                         description  \
0  [At Goodhew we are committed to crafting lifes...   
1  [At Goodhew we are committed to crafting lifes...   
2  [At Goodhew we are committed to crafting lifes...   
3  [At Goodhew we are committed to crafting lifes...   
4  [Sockwell is reinventing the therapeutic sock,...   

                                                 fit  \
0                                                      
1                                                      
2   class="a-normal a-align-center a-spacing-smal...   
3                                                      
4   class=

In [4]:
import json
import pandas as pd
from bs4 import BeautifulSoup
import re
from nltk.corpus import stopwords
from nltk.tokenize import word_tokenize
import os

# Function to clean text
def clean_text(text):
    # Remove HTML tags
    text = BeautifulSoup(text, "html.parser").get_text()
    # Remove non-alphanumeric characters and convert to lowercase
    text = re.sub(r'[^a-zA-Z\s]', '', text).lower()
    # Tokenize the text
    tokens = word_tokenize(text)
    # Remove stopwords
    stop_words = set(stopwords.words('english'))
    tokens = [word for word in tokens if word not in stop_words]
    # Join tokens back into a string
    clean_text = ' '.join(tokens)
    return clean_text

# Function to preprocess data
def preprocess_data(df):
    # Ensure 'description' column contains strings
    df['description'] = df['description'].astype(str)
    
    # Clean 'description' column
    df['description'] = df['description'].apply(clean_text)
    
    # Convert 'price' column to numerical
    df['price'] = df['price'].str.extract(r'\b(\d+\.\d+)\b').astype(float)
    
    # Extract main category from 'category' column
    df['main_category'] = df['category'].apply(lambda x: x[0])
    
    # Drop irrelevant columns
    df.drop(['tech1', 'tech2', 'details', 'similar_item', 'category'], axis=1, inplace=True)
    
    return df



# Load Sampled Amazon dataset
df_chunks = pd.read_json('Sampled_Amazon_Meta.json', lines=True, chunksize=10000)

# Preprocess and write to a new JSON file
output_file = 'preprocessed_amazon_data.json'
with open(output_file, 'w') as f:
    for i, df_chunk in enumerate(df_chunks):
        preprocessed_df_chunk = preprocess_data(df_chunk)
        preprocessed_df_chunk.to_json(f, orient='records', lines=True)
        print(f"Processed chunk {i+1}")

print("Preprocessing complete.")

# Bonus: Perform batch processing in real-time
# Monitor a directory for new files and preprocess them as they arrive
input_directory = 'incoming_data'
output_directory = 'preprocessed_data'
os.makedirs(output_directory, exist_ok=True)

while True:
    # Check for new files in the input directory
    files = os.listdir(input_directory)
    for file in files:
        if file.endswith('.json'):
            input_file = os.path.join(input_directory, file)
            output_file = os.path.join(output_directory, file)
            df = pd.read_json(input_file, lines=True)
            preprocessed_df = preprocess_data(df)
            preprocessed_df.to_json(output_file, orient='records', lines=True)
            print(f"Preprocessed file {file} and saved as {output_file}")
            os.remove(input_file)  # Remove the processed file from the input directory
    time.sleep(60)  # Check for new files every 60 seconds




Processed chunk 1




Processed chunk 2




Processed chunk 3




Processed chunk 4




Processed chunk 5




Processed chunk 6




Processed chunk 7




Processed chunk 8




Processed chunk 9




Processed chunk 10




Processed chunk 11




Processed chunk 12




Processed chunk 13




Processed chunk 14




Processed chunk 15




Processed chunk 16




Processed chunk 17




Processed chunk 18




Processed chunk 19




Processed chunk 20




Processed chunk 21




Processed chunk 22




Processed chunk 23




Processed chunk 24




Processed chunk 25




Processed chunk 26




Processed chunk 27




Processed chunk 28




Processed chunk 29




Processed chunk 30




Processed chunk 31




Processed chunk 32




Processed chunk 33




Processed chunk 34




Processed chunk 35




Processed chunk 36




Processed chunk 37




Processed chunk 38




Processed chunk 39




Processed chunk 40




Processed chunk 41




Processed chunk 42




Processed chunk 43




Processed chunk 44




Processed chunk 45




Processed chunk 46




Processed chunk 47




Processed chunk 48




Processed chunk 49




Processed chunk 50




Processed chunk 51




Processed chunk 52




Processed chunk 53




Processed chunk 54




Processed chunk 55




Processed chunk 56




Processed chunk 57




Processed chunk 58




Processed chunk 59




Processed chunk 60




Processed chunk 61




Processed chunk 62




Processed chunk 63




Processed chunk 64




IndexError: list index out of range