|
|
|
@ -3,6 +3,10 @@ import torch
|
|
|
|
|
import comfy.model_management
|
|
|
|
|
import folder_paths
|
|
|
|
|
import os
|
|
|
|
|
import io
|
|
|
|
|
import json
|
|
|
|
|
import struct
|
|
|
|
|
from comfy.cli_args import args
|
|
|
|
|
|
|
|
|
|
class EmptyLatentAudio:
|
|
|
|
|
def __init__(self):
|
|
|
|
@ -53,6 +57,61 @@ class VAEDecodeAudio:
|
|
|
|
|
audio = vae.decode(samples["samples"]).movedim(-1, 1)
|
|
|
|
|
return ({"waveform": audio, "sample_rate": 44100}, )
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def create_vorbis_comment_block(comment_dict, last_block):
|
|
|
|
|
vendor_string = b'ComfyUI'
|
|
|
|
|
vendor_length = len(vendor_string)
|
|
|
|
|
|
|
|
|
|
comments = []
|
|
|
|
|
for key, value in comment_dict.items():
|
|
|
|
|
comment = f"{key}={value}".encode('utf-8')
|
|
|
|
|
comments.append(struct.pack('<I', len(comment)) + comment)
|
|
|
|
|
|
|
|
|
|
user_comment_list_length = len(comments)
|
|
|
|
|
user_comments = b''.join(comments)
|
|
|
|
|
|
|
|
|
|
comment_data = struct.pack('<I', vendor_length) + vendor_string + struct.pack('<I', user_comment_list_length) + user_comments
|
|
|
|
|
if last_block:
|
|
|
|
|
id = b'\x84'
|
|
|
|
|
else:
|
|
|
|
|
id = b'\x04'
|
|
|
|
|
comment_block = id + struct.pack('>I', len(comment_data))[1:] + comment_data
|
|
|
|
|
|
|
|
|
|
return comment_block
|
|
|
|
|
|
|
|
|
|
def insert_or_replace_vorbis_comment(flac_io, comment_dict):
|
|
|
|
|
if len(comment_dict) == 0:
|
|
|
|
|
return flac_io
|
|
|
|
|
|
|
|
|
|
flac_io.seek(4)
|
|
|
|
|
|
|
|
|
|
blocks = []
|
|
|
|
|
last_block = False
|
|
|
|
|
|
|
|
|
|
while not last_block:
|
|
|
|
|
header = flac_io.read(4)
|
|
|
|
|
last_block = (header[0] & 0x80) != 0
|
|
|
|
|
block_type = header[0] & 0x7F
|
|
|
|
|
block_length = struct.unpack('>I', b'\x00' + header[1:])[0]
|
|
|
|
|
block_data = flac_io.read(block_length)
|
|
|
|
|
|
|
|
|
|
if block_type == 4 or block_type == 1:
|
|
|
|
|
pass
|
|
|
|
|
else:
|
|
|
|
|
header = bytes([(header[0] & (~0x80))]) + header[1:]
|
|
|
|
|
blocks.append(header + block_data)
|
|
|
|
|
|
|
|
|
|
blocks.append(create_vorbis_comment_block(comment_dict, last_block=True))
|
|
|
|
|
|
|
|
|
|
new_flac_io = io.BytesIO()
|
|
|
|
|
new_flac_io.write(b'fLaC')
|
|
|
|
|
for block in blocks:
|
|
|
|
|
new_flac_io.write(block)
|
|
|
|
|
|
|
|
|
|
new_flac_io.write(flac_io.read())
|
|
|
|
|
return new_flac_io
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class SaveAudio:
|
|
|
|
|
def __init__(self):
|
|
|
|
|
self.output_dir = folder_paths.get_output_directory()
|
|
|
|
@ -78,11 +137,27 @@ class SaveAudio:
|
|
|
|
|
filename_prefix += self.prefix_append
|
|
|
|
|
full_output_folder, filename, counter, subfolder, filename_prefix = folder_paths.get_save_image_path(filename_prefix, self.output_dir)
|
|
|
|
|
results = list()
|
|
|
|
|
|
|
|
|
|
metadata = {}
|
|
|
|
|
if not args.disable_metadata:
|
|
|
|
|
if prompt is not None:
|
|
|
|
|
metadata["prompt"] = json.dumps(prompt)
|
|
|
|
|
if extra_pnginfo is not None:
|
|
|
|
|
for x in extra_pnginfo:
|
|
|
|
|
metadata[x] = json.dumps(extra_pnginfo[x])
|
|
|
|
|
|
|
|
|
|
for (batch_number, waveform) in enumerate(audio["waveform"]):
|
|
|
|
|
#TODO: metadata
|
|
|
|
|
filename_with_batch_num = filename.replace("%batch_num%", str(batch_number))
|
|
|
|
|
file = f"{filename_with_batch_num}_{counter:05}_.flac"
|
|
|
|
|
torchaudio.save(os.path.join(full_output_folder, file), waveform, audio["sample_rate"], format="FLAC")
|
|
|
|
|
|
|
|
|
|
buff = io.BytesIO()
|
|
|
|
|
torchaudio.save(buff, waveform, audio["sample_rate"], format="FLAC")
|
|
|
|
|
|
|
|
|
|
buff = insert_or_replace_vorbis_comment(buff, metadata)
|
|
|
|
|
|
|
|
|
|
with open(os.path.join(full_output_folder, file), 'wb') as f:
|
|
|
|
|
f.write(buff.getbuffer())
|
|
|
|
|
|
|
|
|
|
results.append({
|
|
|
|
|
"filename": file,
|
|
|
|
|
"subfolder": subfolder,
|
|
|
|
|