-
Notifications
You must be signed in to change notification settings - Fork 2
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
1 parent
999ba7c
commit a49f620
Showing
3 changed files
with
127 additions
and
48 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,40 +1,111 @@ | ||
from pathlib import Path | ||
|
||
from plotly.subplots import make_subplots | ||
import plotly.graph_objects as go | ||
import pandas as pd | ||
import torch | ||
from torchvision.datasets import CIFAR10 | ||
from torchvision.transforms.v2.functional import to_tensor | ||
from polyapprox.ols import ols | ||
from mdl.mlp_probe import MlpProbe | ||
import lovely_tensors as lt | ||
|
||
lt.monkey_patch() | ||
|
||
def get_cifar10_mean():
    """Return the mean over all images of the flattened CIFAR-10 tensors.

    The dataset is read from ``/home/lucia/cifar10`` (downloaded if missing),
    each image is converted with ``to_tensor`` and flattened to one row, and
    the rows are averaged along dimension 0.
    """
    nontest = CIFAR10("/home/lucia/cifar10", download=True)

    images, labels = zip(*nontest)
    X = torch.stack(list(map(to_tensor, images)))
    X = X.view(X.shape[0], -1)

    return X.mean(dim=0)


def plot(ols_results, filename='polyapprox_mlp_fvu'):
    """Plot FVU against checkpoint number, one subplot row per eraser.

    Args:
        ols_results: Mapping from checkpoint file name to a result object
            exposing an ``fvu`` attribute. The last four characters of each
            name are dropped and the remainder is split on "-": the final
            chunk is parsed as the integer checkpoint number, and the first
            space-separated token of the first chunk is the eraser label.
        filename: Output path without extension; the figure is written to
            ``{filename}.pdf``.

    Entries whose FVU is below -0.01 are reported and skipped. If nothing is
    left to plot, a message is printed and no file is written.
    """
    fvu = []
    checkpoint = []
    eraser = []
    for key, value in ols_results.items():
        if value.fvu < -0.01:
            print(f"{key} has FVU {value.fvu}. Skipping.")
            continue

        fvu.append(value.fvu)
        # key[:-4] strips a four-character extension such as ".pth".
        chunks = key[:-4].split("-")
        checkpoint.append(int(chunks[-1]))
        eraser.append(chunks[0].split(" ")[0])

    # make_subplots rejects rows=0, so bail out before building the figure.
    if not fvu:
        print("No FVU results to plot.")
        return

    df = pd.DataFrame({"fvu": fvu, "checkpoint": checkpoint, "eraser": eraser})
    df = df.sort_values(by="checkpoint")

    erasers = df.eraser.unique()
    fig = make_subplots(rows=len(erasers), cols=1)

    for row, name in enumerate(erasers, start=1):
        df_eraser = df[df.eraser == name]
        fig.add_trace(
            go.Scatter(
                x=df_eraser.checkpoint, y=df_eraser.fvu, mode="lines", name=name
            ),
            row=row,
            col=1,
        )

    fig.update_layout(title="FVU over checkpoints")
    fig.write_image(f"{filename}.pdf", format="pdf")
|
||
# Load each MLP checkpoint ols | ||
out_path = Path("polyapprox_mlp.pth")
ckpts = list(Path("probe-ckpts").glob("*.pth"))
# Resume from previously saved results when the cache file exists.
ols_results = torch.load(out_path) if out_path.exists() else {}
# On a fresh run there is nothing cached yet; plotting an empty mapping would
# fail inside make_subplots (rows=0) before any checkpoint is processed.
if ols_results:
    plot(ols_results)
|
||
|
||
def polyapprox_linear(ckpts):
    """Fit a polynomial approximation to each "normalize" probe checkpoint.

    For every path in ``ckpts`` whose file name contains "normalize", a
    one-hidden-layer ``MlpProbe`` is loaded and its two linear layers are
    passed to ``ols``. Results are collected per checkpoint name, saved next
    to ``out_path`` under a ``_linear`` suffix, and plotted to
    ``polyapprox_mlp_linear.pdf``.

    Args:
        ckpts: Iterable of ``pathlib.Path`` objects pointing at probe
            state-dict files.
    """
    # Keep this pass's output separate from the cache at ``out_path``;
    # writing there would overwrite the results loaded at module level.
    linear_out_path = out_path.with_name(
        f"{out_path.stem}_linear{out_path.suffix}"
    )

    linear_results = {}
    for ckpt in ckpts:
        if "normalize" not in ckpt.name:
            continue

        print(f"Processing {ckpt.name}")

        probe = MlpProbe(
            num_features=32 * 32 * 3, num_classes=10, hidden_size=128, num_layers=1
        )
        probe.load_state_dict(torch.load(ckpt))
        probe.eval()

        # NOTE(review): despite the function name this still requests
        # order="quadratic", as the original did - confirm whether
        # order="linear" was intended.
        result = ols(
            probe.net[0].weight.data.double().numpy(),
            probe.net[0].bias.data.double().numpy(),
            probe.net[2].weight.data.double().numpy(),
            probe.net[2].bias.data.double().numpy(),
            act="relu",
            order="quadratic",
            return_fvu=True,
        )
        # Store in this function's own mapping so that what is saved and
        # plotted below actually contains the fits computed here.
        linear_results[ckpt.name] = result
        print(f"FVU: {result.fvu}")

    torch.save(linear_results, linear_out_path)
    # Plotting an empty mapping fails inside make_subplots (rows=0).
    if linear_results:
        plot(linear_results, filename="polyapprox_mlp_linear")
|
||
polyapprox_linear(ckpts)
# NOTE: the script stops here, so the quadratic pass below is currently
# unreachable until this exit() is removed.
exit()

# Quadratic approximation of every "normalize" probe checkpoint, keyed by
# checkpoint file name and cached in ``out_path``.
for ckpt in ckpts:
    if "normalize" not in ckpt.name:
        continue

    if ckpt.name in ols_results:
        print(f"Skipping {ckpt.name} because it already exists")
        continue

    print(f"Processing {ckpt.name}")

    probe = MlpProbe(
        num_features=32 * 32 * 3, num_classes=10, hidden_size=128, num_layers=1
    )
    probe.load_state_dict(torch.load(ckpt))
    probe.eval()

    ols_results[ckpt.name] = ols(
        probe.net[0].weight.data.double().numpy(),
        probe.net[0].bias.data.double().numpy(),
        probe.net[2].weight.data.double().numpy(),
        probe.net[2].bias.data.double().numpy(),
        act="relu",
        order="quadratic",
        return_fvu=True,
    )
    # Persist after each checkpoint so an interrupted run can resume via the
    # "already exists" check above.
    torch.save(ols_results, out_path)

# Plotting an empty mapping fails inside make_subplots (rows=0).
if ols_results:
    plot(ols_results)
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters