python-mastery

# theory

reading

# Read entire file
# read() returns the whole file as one string, so the full contents are
# held in memory at once.
with open("file.txt", "r") as f:
    content = f.read()

# Read lines into list
# readlines() builds a list with one string per line.
with open("file.txt", "r") as f:
    lines = f.readlines()

# Read line by line (memory efficient)
# Iterating the file object yields one line at a time instead of loading
# everything up front; strip() removes surrounding whitespace (including
# the trailing newline) before printing.
with open("file.txt", "r") as f:
    for line in f:
        print(line.strip())

writing

# Write (overwrites existing)
# Mode "w" replaces any existing contents of output.txt; write() adds no
# line ending of its own, so the newline is spelled out in the string.
with open("output.txt", "w") as f:
    f.write("Hello, World!\n")

# Append to existing
# Mode "a" adds to the end of the file instead of replacing it.
with open("output.txt", "a") as f:
    f.write("Another line\n")

# Write multiple lines
# writelines() writes each item as-is, so a newline is appended to every
# entry by the generator expression.
lines = ["Line 1", "Line 2", "Line 3"]
with open("output.txt", "w") as f:
    f.writelines(line + "\n" for line in lines)

the with statement

Always use with to ensure files are properly closed:

# Good - file automatically closes
# Leaving the with block closes f, even if read() raises an exception.
with open("file.txt") as f:
    data = f.read()

# Bad - you might forget to close
# If read() raises, the close() call below is never reached and the file
# handle stays open.
f = open("file.txt")
data = f.read()
f.close()  # Easy to forget!

file modes

Mode	Meaning
"r"	Read (default)
"w"	Write (overwrites)
"a"	Append
"x"	Create (fails if exists)
"b"	Binary mode (combined with another mode, e.g. "rb" or "wb")
"r+"	Read and write

the csv module

import csv

# Read CSV
# Files handed to the csv module should be opened with newline="" so the
# reader itself handles line endings; otherwise newlines embedded inside
# quoted fields may be interpreted incorrectly.
with open("data.csv", newline="") as f:
    reader = csv.reader(f)
    for row in reader:
        print(row)  # row is a list

# Read as dictionaries
# DictReader uses the first row as the field names, so each row is
# addressed by column header instead of by position.
with open("data.csv", newline="") as f:
    reader = csv.DictReader(f)
    for row in reader:
        print(row["column_name"])

# Write CSV
# newline="" here keeps the writer's own line terminator from being
# translated a second time (which would produce blank rows on Windows).
with open("output.csv", "w", newline="") as f:
    writer = csv.writer(f)
    writer.writerow(["Name", "Age"])
    writer.writerow(["Alice", 25])

loading real-size data

The browser can't read /Users/you/data.csv, but it can pyfetch a URL and feed the response text to pd.read_csv or csv.DictReader through io.StringIO. That's how the examples below switch from 8-row toy CSVs to real datasets with hundreds to thousands of rows.

import io
import pandas as pd
from pyodide.http import pyfetch

# Public CSV served from raw.githubusercontent.com.
URL = "https://raw.githubusercontent.com/plotly/datasets/master/diabetes.csv"
# pyfetch is awaited at top level, so this snippet needs an environment
# that allows top-level await (the import above targets Pyodide).
resp = await pyfetch(URL)
# The awaited response body is wrapped in StringIO so read_csv can consume
# it like an open text file.
df = pd.read_csv(io.StringIO(await resp.string()))
print(df.shape)  # (768, 9)

Any raw.githubusercontent.com URL is CORS-friendly. Plotly and Vega both maintain large dataset repos that work without auth.

# examples [4]

# example 01 · reading line by line

Process each line individually

1

2

3

4

5

6

7

8

9

10

🐍

Loading Python... Setting up pandas & numpy...

# example 02 · writing content

Write text to a file-like object

1

2

3

4

5

6

7

8

9

10

11

🐍

Loading Python... Setting up pandas & numpy...

# example 03 · CSV operations

Read and parse CSV data

1

2

3

4

5

6

7

8

9

10

11

12

🐍

Loading Python... Setting up pandas & numpy...

# example 04 · loading a real-size CSV via pyfetch

Fetch a 768-row public dataset and load it straight into pandas. It's the same code you'd write against a local file; just swap open() for pyfetch + StringIO.

1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

import io
import pandas as pd
from pyodide.http import pyfetch

# Public CSV served from raw.githubusercontent.com.
URL = "https://raw.githubusercontent.com/plotly/datasets/master/diabetes.csv"
# Top-level await: runs only where the environment permits it (the import
# above targets Pyodide).
resp = await pyfetch(URL)
# Wrap the awaited response body in StringIO so read_csv treats it like a
# file opened in text mode.
df = pd.read_csv(io.StringIO(await resp.string()))

# Quick structural overview: dimensions, column names, first rows.
print(f"shape: {df.shape}")
print(f"columns: {list(df.columns)}")
print("\nfirst 5 rows:")
print(df.head())

# describe() on a three-column subset, rounded to one decimal place.
print("\nsummary stats (Glucose, BloodPressure, BMI):")
print(df[["Glucose", "BloodPressure", "BMI"]].describe().round(1))

🐍

Loading Python... Setting up pandas & numpy...

# challenges [2]

# challenge 01/02 · todo

Read data='A:1\nB:2\nC:3' line by line, split each by ':', and print key-value pairs.

1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

import io

# A browser sandbox has no real filesystem, so io.StringIO stands in for
# an opened text file throughout this exercise.

file_content = (
    "Line 1: Hello\n"
    "Line 2: World\n"
    "Line 3: Python"
)

# Pass 1: pull the entire buffer out as a single string.
all_text = io.StringIO(file_content).read()
print("All content:", all_text, sep="\n")

# Pass 2: a fresh buffer, consumed line by line into a list (each entry
# keeps its trailing newline, except the last, which has none).
f = io.StringIO(file_content)
lines = list(f)
print("\nAs lines list:", lines, sep="\n")


# Read data='A:1\nB:2\nC:3' line by line, split each by ':', and print key-value pairs.
# Your code here:

🐍

Loading Python... Setting up pandas & numpy...

# challenge 02/02 · todo

Use csv.DictReader to read 'name,score\nAlice,95\nBob,82' and print each name and score.

1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

import io

# A browser sandbox has no real filesystem, so io.StringIO stands in for
# an opened text file throughout this exercise.

file_content = (
    "Line 1: Hello\n"
    "Line 2: World\n"
    "Line 3: Python"
)

# Pass 1: pull the entire buffer out as a single string.
all_text = io.StringIO(file_content).read()
print("All content:", all_text, sep="\n")

# Pass 2: a fresh buffer, consumed line by line into a list (each entry
# keeps its trailing newline, except the last, which has none).
f = io.StringIO(file_content)
lines = list(f)
print("\nAs lines list:", lines, sep="\n")


# Use csv.DictReader to read 'name,score\nAlice,95\nBob,82' and print each name and score.
# Your code here:

🐍

Loading Python... Setting up pandas & numpy...

# project

# project-challenge

thread: Sales Performance Dashboard · reward: 50 xp

# brief

Management wants a text summary of sales by region. Generate a report showing total revenue per region and write it to a file-like object for export.

# task

Write Sales Summary Report

# your code

1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

26

27

28

import pandas as pd
import io

# Inline sales dataset: a header row followed by one row per sale.
# There is no revenue column; it has to be derived from Quantity and
# UnitPrice (see the task list below).
sales_csv = """SaleID,SalesRep,Region,Product,Category,Quantity,UnitPrice,SaleDate,CustomerSegment
S001,Alice Chen,North,Widget Pro,Electronics,15,49.99,2023-01-05,Enterprise
S002,Bob Martinez,South,Gadget Plus,Tools,8,29.99,2023-01-08,SMB
S003,Carol Davis,East,Widget Pro,Electronics,22,49.99,2023-01-10,Enterprise
S004,Dan Wilson,West,Super Tool,Tools,45,19.99,2023-01-12,Consumer
S005,Eva Brown,North,Power Unit,Electronics,10,89.99,2023-01-15,Enterprise
S006,Alice Chen,North,Gadget Plus,Tools,30,29.99,2023-01-18,SMB
S007,Bob Martinez,South,Widget Pro,Electronics,18,49.99,2023-01-20,Consumer
S008,Carol Davis,East,Super Tool,Tools,55,19.99,2023-02-01,SMB
S009,Dan Wilson,West,Power Unit,Electronics,8,89.99,2023-02-05,Enterprise
S010,Eva Brown,North,Widget Basic,Electronics,65,24.99,2023-02-10,Consumer
S011,Alice Chen,North,Super Tool,Tools,40,19.99,2023-02-15,Consumer
S012,Bob Martinez,South,Power Unit,Electronics,12,89.99,2023-02-20,Enterprise
S013,Carol Davis,East,Gadget Plus,Tools,25,29.99,2023-03-01,SMB
S014,Dan Wilson,West,Widget Pro,Electronics,20,49.99,2023-03-05,Enterprise
S015,Eva Brown,North,Widget Basic,Electronics,80,24.99,2023-03-10,Consumer"""

# StringIO wraps the string so read_csv can parse it like an open file.
sales = pd.read_csv(io.StringIO(sales_csv))

# Task:
# 1. Calculate revenue (Quantity * UnitPrice) for each sale
# 2. Group by Region and sum the revenue
# 3. Write a formatted report to a StringIO object
# 4. Print the report contents

import pandas as pd
import io

# Inline sales dataset: a header row followed by one row per sale.
# There is no revenue column; it has to be derived from Quantity and
# UnitPrice (see the task list below).
sales_csv = """SaleID,SalesRep,Region,Product,Category,Quantity,UnitPrice,SaleDate,CustomerSegment
S001,Alice Chen,North,Widget Pro,Electronics,15,49.99,2023-01-05,Enterprise
S002,Bob Martinez,South,Gadget Plus,Tools,8,29.99,2023-01-08,SMB
S003,Carol Davis,East,Widget Pro,Electronics,22,49.99,2023-01-10,Enterprise
S004,Dan Wilson,West,Super Tool,Tools,45,19.99,2023-01-12,Consumer
S005,Eva Brown,North,Power Unit,Electronics,10,89.99,2023-01-15,Enterprise
S006,Alice Chen,North,Gadget Plus,Tools,30,29.99,2023-01-18,SMB
S007,Bob Martinez,South,Widget Pro,Electronics,18,49.99,2023-01-20,Consumer
S008,Carol Davis,East,Super Tool,Tools,55,19.99,2023-02-01,SMB
S009,Dan Wilson,West,Power Unit,Electronics,8,89.99,2023-02-05,Enterprise
S010,Eva Brown,North,Widget Basic,Electronics,65,24.99,2023-02-10,Consumer
S011,Alice Chen,North,Super Tool,Tools,40,19.99,2023-02-15,Consumer
S012,Bob Martinez,South,Power Unit,Electronics,12,89.99,2023-02-20,Enterprise
S013,Carol Davis,East,Gadget Plus,Tools,25,29.99,2023-03-01,SMB
S014,Dan Wilson,West,Widget Pro,Electronics,20,49.99,2023-03-05,Enterprise
S015,Eva Brown,North,Widget Basic,Electronics,80,24.99,2023-03-10,Consumer"""

# StringIO wraps the string so read_csv can parse it like an open file.
sales = pd.read_csv(io.StringIO(sales_csv))

# Task:
# 1. Calculate revenue (Quantity * UnitPrice) for each sale
# 2. Group by Region and sum the revenue
# 3. Write a formatted report to a StringIO object
# 4. Print the report contents

🐍

Loading Python... Setting up pandas & numpy...

File I/O

reading

writing

the with statement

file modes

the csv module

loading real-size data

Write Sales Summary Report