import math
import time
import statistics
import numpy as np

# Synthetic wage series: a baseline of 10, a sine component, and an offset
# that cycles through 0..6 with the observation index.
n = 300_000


def _synthetic_wage(i):
    """Return the synthetic wage for observation index ``i``."""
    seasonal = 20 * math.sin(i / 3000)
    return 10 + seasonal + (i % 7)


# The same values held two ways: a plain Python list and a NumPy array.
wages_list = list(map(_synthetic_wage, range(n)))
wages_array = np.array(wages_list)
len(wages_list), wages_array.shape

def score_loop(x):
    """Score every element of ``x`` as ``log(1 + value**2)`` using an explicit loop.

    Args:
        x: Iterable of numbers.

    Returns:
        A new list with one score per element, in input order.
    """
    scores = []
    for wage in x:
        squared = wage**2
        scores.append(math.log(1 + squared))
    return scores

def score_list_comp(x):
    """Score every element of ``x`` as ``log(1 + value**2)`` with a list comprehension.

    Args:
        x: Iterable of numbers.

    Returns:
        A new list with one score per element, in input order.
    """
    scores = [math.log(1 + wage**2) for wage in x]
    return scores

def score_numpy(x):
    """Score ``x`` element-wise as ``log(1 + x**2)`` in one vectorized expression.

    Args:
        x: Object supporting ``x ** 2`` and addition with ``1``; the
            notebook passes a NumPy array.

    Returns:
        The result of ``np.log`` applied to ``1 + x ** 2``.
    """
    shifted_squares = 1 + x**2
    return np.log(shifted_squares)

def benchmark(func, obj, repeats=3):
    """Time ``func(obj)`` over several runs and summarize the wall-clock cost.

    Args:
        func: Callable invoked with ``obj`` as its only argument.
        obj: Value handed to ``func`` on every run.
        repeats: Number of timed runs.

    Returns:
        A dict with ``mean_seconds``, ``min_seconds`` and ``max_seconds``,
        each rounded to four decimal places.
    """
    elapsed = []
    for _ in range(repeats):
        started = time.perf_counter()
        func(obj)
        finished = time.perf_counter()
        elapsed.append(finished - started)

    summary = {
        "mean_seconds": statistics.mean(elapsed),
        "min_seconds": min(elapsed),
        "max_seconds": max(elapsed),
    }
    return {label: round(seconds, 4) for label, seconds in summary.items()}

# Time the three scoring implementations on the same wage values: the two
# pure-Python versions receive the list, the NumPy version receives the array.
results = {}
results["loop"] = benchmark(score_loop, wages_list)
results["list_comprehension"] = benchmark(score_list_comp, wages_list)
results["numpy_vectorized"] = benchmark(score_numpy, wages_array)
results

# The IDs 0..199_999 and the lookups to run against them. Queries
# 150_000..199_999 are present among the IDs; 200_000..249_999 are not.
ids = [*range(200_000)]
queries = [*range(150_000, 250_000)]

# The same IDs stored as a set and as dict keys (every value is True).
id_set = set(ids)
id_dict = dict.fromkeys(ids, True)

def count_membership(container, queries):
    """Count how many items of ``queries`` are found in ``container``.

    Args:
        container: Any object supporting the ``in`` operator.
        queries: Iterable of values to look up; repeated values are
            counted each time they are found.

    Returns:
        The number of queries for which ``q in container`` is true.
    """
    return sum(1 for q in queries if q in container)

def _count_queries_in(container):
    """Count how many of the module-level ``queries`` occur in ``container``."""
    return count_membership(container, queries)


# benchmark() invokes func(obj) with a single argument, while
# count_membership() needs both the container and the queries, so it cannot
# be passed to benchmark() directly (that call fails with TypeError). The
# one-argument adapter above binds ``queries`` so that only the container
# varies between the three runs.
# NOTE(review): the list case searches the list once per query (100_000
# queries against 200_000 IDs, repeated 3 times), so expect it to take far
# longer than the set and dict cases -- shrink ``queries`` if that is too
# slow for interactive use.
membership_results = {
    "list": benchmark(_count_queries_in, ids),
    "set": benchmark(_count_queries_in, id_set),
    "dict": benchmark(_count_queries_in, id_dict),
}
membership_results

# Positional records: what each slot means is not stated anywhere in the data.
researchers_bad = [
    ["Ana", "macro", 3],
    ["Luca", "labor", 1],
    ["Mina", "text", 4],
]

# The same three records with every value labelled by a key.
researchers_good = [
    dict(zip(("name", "field", "projects"), record))
    for record in researchers_bad
]

print("Opaque access:", researchers_bad[0][2])
print("Readable access:", researchers_good[0]["projects"])

Extra L2 — Data Structures, Complexity, and Vectorization

Goal

Why this matters

1. A simple problem

Interpretation

2. Membership tests: list vs set vs dictionary

Why this matters

3. Reliability and structure

4. Short exercise

Optional extension