In [6]:
import pandas as pd
import os
from IPython.display import display
# Robust CSV discovery and loading
target_filename = 'wetter.csv'
# Start searching common places (project root and ./data)
search_roots = [os.path.join(os.getcwd(), 'data'), os.path.join(os.getcwd())]
found_paths = []
for root in search_roots:
    if os.path.exists(root):
        for dirpath, dirnames, filenames in os.walk(root):
            if target_filename in filenames:
                found_paths.append(os.path.join(dirpath, target_filename))
# As a final fallback, scan the entire workspace once
if not found_paths:
    for dirpath, dirnames, filenames in os.walk(os.getcwd()):
        if target_filename in filenames:
            found_paths.append(os.path.join(dirpath, target_filename))
df = None
if not found_paths:
    print(f'Could not find `{target_filename}` in the workspace.')
    print("Place the file under `./data/` or upload it via VS Code Explorer.")
else:
    path = found_paths[0]
    print(f'Found file: {path}')
    # Try multiple encodings and separators to be resilient with CSV format
    encodings = ['utf-8', 'latin-1', 'cp1252']
    seps = [';', ',', '\t']
    loaded = False
    last_error = None
    for enc in encodings:
        for sep in seps:
            try:
                df = pd.read_csv(path, sep=sep, encoding=enc)
                print(f'Loaded CSV with encoding={enc!r}, sep={sep!r}')
                loaded = True
                break
            except Exception as e:
                last_error = e
        if loaded:
            break
    if not loaded:
        print('Failed to parse CSV with tried encodings/separators. Last error:')
        print(last_error)
# If loaded, show a small preview and shape
if df is not None:
    display(df.head())
    print(f'DataFrame shape: {df.shape}')
else:
    print('No DataFrame was loaded.')

Found file: /workspaces/Group/data/wetter.csv
Loaded CSV with encoding='utf-8', sep=';'


Unnamed: 0,"Datum,Bewoelkung,Temperatur,Windgeschwindigkeit,Wettercode"
0,"2012-01-01,8,9.825,14,58"
1,"2012-01-02,7,7.4375,12,"
2,"2012-01-03,8,5.5375,18,63"
3,"2012-01-04,4,5.6875,19,80"
4,"2012-01-05,6,5.3,23,80"


DataFrame shape: (2601, 1)
