2022-11-12 06:01:24 +03:00
|
|
|
import os
|
|
|
|
import torch
|
|
|
|
import argparse
|
|
|
|
|
|
|
|
|
2023-06-23 05:58:20 +03:00
|
|
|
parser = argparse.ArgumentParser(description="Pruning")
|
|
|
|
parser.add_argument("--ckpt", type=str, default=None, help="path to model ckpt")
|
2022-11-12 06:01:24 +03:00
|
|
|
args = parser.parse_args()
|
|
|
|
ckpt = args.ckpt
|
|
|
|
|
2023-06-23 05:58:20 +03:00
|
|
|
|
2022-11-12 06:01:24 +03:00
|
|
|
def prune_it(p, keep_only_ema=False):
|
|
|
|
print(f"prunin' in path: {p}")
|
|
|
|
size_initial = os.path.getsize(p)
|
|
|
|
nsd = dict()
|
|
|
|
sd = torch.load(p, map_location="cpu")
|
|
|
|
print(sd.keys())
|
|
|
|
for k in sd.keys():
|
|
|
|
if k != "optimizer_states":
|
|
|
|
nsd[k] = sd[k]
|
|
|
|
else:
|
|
|
|
print(f"removing optimizer states for path {p}")
|
|
|
|
if "global_step" in sd:
|
|
|
|
print(f"This is global step {sd['global_step']}.")
|
|
|
|
if keep_only_ema:
|
|
|
|
sd = nsd["state_dict"].copy()
|
|
|
|
# infer ema keys
|
2023-06-23 05:58:20 +03:00
|
|
|
ema_keys = {
|
|
|
|
k: "model_ema." + k[6:].replace(".", ".")
|
|
|
|
for k in sd.keys()
|
|
|
|
if k.startswith("model.")
|
|
|
|
}
|
2022-11-12 06:01:24 +03:00
|
|
|
new_sd = dict()
|
|
|
|
|
|
|
|
for k in sd:
|
|
|
|
if k in ema_keys:
|
|
|
|
new_sd[k] = sd[ema_keys[k]].half()
|
2023-06-23 05:58:20 +03:00
|
|
|
elif not k.startswith("model_ema.") or k in [
|
|
|
|
"model_ema.num_updates",
|
|
|
|
"model_ema.decay",
|
|
|
|
]:
|
2022-11-12 06:01:24 +03:00
|
|
|
new_sd[k] = sd[k].half()
|
|
|
|
|
|
|
|
assert len(new_sd) == len(sd) - len(ema_keys)
|
|
|
|
nsd["state_dict"] = new_sd
|
|
|
|
else:
|
2023-06-23 05:58:20 +03:00
|
|
|
sd = nsd["state_dict"].copy()
|
2022-11-12 06:01:24 +03:00
|
|
|
new_sd = dict()
|
|
|
|
for k in sd:
|
|
|
|
new_sd[k] = sd[k].half()
|
2023-06-23 05:58:20 +03:00
|
|
|
nsd["state_dict"] = new_sd
|
2022-11-12 06:01:24 +03:00
|
|
|
|
2023-06-23 05:58:20 +03:00
|
|
|
fn = (
|
|
|
|
f"{os.path.splitext(p)[0]}-pruned.ckpt"
|
|
|
|
if not keep_only_ema
|
|
|
|
else f"{os.path.splitext(p)[0]}-ema-pruned.ckpt"
|
|
|
|
)
|
2022-11-12 06:01:24 +03:00
|
|
|
print(f"saving pruned checkpoint at: {fn}")
|
|
|
|
torch.save(nsd, fn)
|
|
|
|
newsize = os.path.getsize(fn)
|
2023-06-23 05:58:20 +03:00
|
|
|
MSG = (
|
|
|
|
f"New ckpt size: {newsize*1e-9:.2f} GB. "
|
|
|
|
+ f"Saved {(size_initial - newsize)*1e-9:.2f} GB by removing optimizer states"
|
|
|
|
)
|
2022-11-12 06:01:24 +03:00
|
|
|
if keep_only_ema:
|
|
|
|
MSG += " and non-EMA weights"
|
|
|
|
print(MSG)
|
|
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
|
2023-06-23 05:58:20 +03:00
|
|
|
prune_it(ckpt)
|