sander-wood
/

clamp2

Feature Extraction

Model card Files Files and versions Community

clamp2 / music_classification /inference_cls.py

sander-wood's picture

Upload 32 files

3c428bc verified about 1 month ago

history blame contribute delete

2.62 kB

	import os
	import json
	import torch
	import random
	import numpy as np
	from utils import *
	from tqdm import tqdm
	from samplings import *
	import argparse

	def list_files_in_directory(directories, extensions=("npy",)):
	    """Recursively collect files whose names end with one of the given suffixes.

	    Args:
	        directories: Iterable of directory paths to walk. Directories are
	            processed in the order given.
	        extensions: Suffix or iterable of suffixes to match against file
	            names (plain ``str.endswith`` matching, so ``"npy"`` also
	            matches a file literally named ``foonpy``). A single string is
	            treated as one suffix, not as a sequence of characters.

	    Returns:
	        A list of file paths (each built with ``os.path.join(root, name)``).
	        Within each walked directory, sub-directories and files are visited
	        in sorted order so the result is reproducible across runs.
	    """
	    # A bare string would otherwise be iterated character by character.
	    if isinstance(extensions, str):
	        extensions = (extensions,)
	    # str.endswith accepts a tuple of suffixes; an empty tuple matches nothing.
	    suffixes = tuple(extensions)

	    file_list = []
	    for directory in directories:
	        for root, dirs, files in os.walk(directory):
	            # Sorting ``dirs`` in place fixes the traversal order of os.walk,
	            # which otherwise follows arbitrary filesystem order.
	            dirs.sort()
	            file_list.extend(
	                os.path.join(root, name)
	                for name in sorted(files)
	                if name.endswith(suffixes)
	            )

	    return file_list

	if __name__ == "__main__":
	    # Command-line interface: a folder of feature files in, a JSON file of
	    # predicted labels out.
	    parser = argparse.ArgumentParser(description="Feature extraction and classification with CLaMP2.")
	    parser.add_argument("feature_folder", type=str, help="Directory containing input feature files.")
	    parser.add_argument("output_file", type=str, help="File to save the classification results. (format: json)")

	    args = parser.parse_args()
	    feature_folder = args.feature_folder
	    output_file = args.output_file

	    device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")

	    # Seed every RNG in use and pin cuDNN to deterministic kernels so
	    # repeated runs behave the same.
	    seed = 42
	    random.seed(seed)
	    np.random.seed(seed)
	    torch.manual_seed(seed)
	    torch.cuda.manual_seed_all(seed)
	    torch.backends.cudnn.deterministic = True
	    torch.backends.cudnn.benchmark = False

	    # WEIGHTS_PATH and LinearClassification come from the star imports at the
	    # top of the file. The checkpoint is read on CPU first; the model is moved
	    # to ``device`` below.
	    # NOTE(review): torch.load unpickles the file - only load checkpoints
	    # from a trusted source.
	    checkpoint = torch.load(WEIGHTS_PATH, map_location='cpu')
	    print(f"Successfully Loaded Checkpoint from Epoch {checkpoint['epoch']} with acc {checkpoint['max_eval_acc']}")
	    label2idx = checkpoint['labels']
	    # Reverse mapping: predicted class index -> label.
	    idx2label = {idx: label for label, idx in label2idx.items()}
	    model = LinearClassification(num_classes=len(label2idx))
	    model = model.to(device)

	    # Report the number of trainable parameters.
	    print("Parameter Number: "+str(sum(p.numel() for p in model.parameters() if p.requires_grad)))

	    model.eval()
	    model.load_state_dict(checkpoint['model'])

	    # Collect every .npy feature file under the input folder (recursively).
	    feature_files = list_files_in_directory([feature_folder])
	    cls_results = {}

	    # Inference only: disable autograd so no graph is recorded per file.
	    with torch.no_grad():
	        for filepath in tqdm(feature_files):
	            # Only the first entry along axis 0 of each saved array is used;
	            # presumably one feature vector per file - TODO confirm layout.
	            features = np.load(filepath)[0]
	            # Add a leading batch dimension of size 1 before calling the model.
	            features = torch.from_numpy(features).to(device).unsqueeze(0)
	            scores = model(features)[0]
	            # argmax returns the first index on ties, matching the previous
	            # ``list.index(max(...))`` lookup.
	            cls_idx = int(torch.argmax(scores).item())
	            cls_results[filepath] = idx2label[cls_idx]

	    # Mapping of feature file path -> predicted label.
	    with open(output_file, "w", encoding="utf-8") as f:
	        json.dump(cls_results, f)