0925 add usable yamls

This commit is contained in:
FelixChan
2025-09-25 15:41:00 +08:00
parent a20c1ed814
commit 5b8bfd70e3
95 changed files with 906 additions and 47 deletions

View File

@ -14,7 +14,7 @@ defaults:
# - nn_params: remi8_main12_head_16_dim512
# - nn_params: nb5_embSum_diff_main12head16dim768_sub3
dataset: SOD # Pop1k7, Pop909, SOD, LakhClean,PretrainingDataset FinetuneDataset
dataset: LakhClean # Pop1k7, Pop909, SOD, LakhClean, PretrainingDataset, FinetuneDataset
captions_path: dataset/midicaps/train_set.json
# dataset: SymphonyNet_Dataset # Pop1k7, Pop909, SOD, LakhClean

View File

@ -1,7 +1,7 @@
encoding_scheme: cp
num_features: 5
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention

View File

@ -1,7 +1,7 @@
encoding_scheme: cp
num_features: 5
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention

View File

@ -1,7 +1,7 @@
encoding_scheme: cp
num_features: 5
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: FeedForward

View File

@ -1,7 +1,7 @@
encoding_scheme: cp
num_features: 5
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: FeedForward

View File

@ -1,7 +1,7 @@
encoding_scheme: cp
num_features: 7
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention

View File

@ -1,7 +1,7 @@
encoding_scheme: cp
num_features: 7
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention

View File

@ -1,7 +1,7 @@
encoding_scheme: cp
num_features: 7
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: FeedForward

View File

@ -1,7 +1,7 @@
encoding_scheme: cp
num_features: 7
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: FeedForward

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: FeedForward

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: Parallel

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: RNN

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: SelfAttention

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 7
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 7
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 7
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: FeedForward

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 7
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: Parallel

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 7
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: RNN

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 7
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: SelfAttention

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SelfAttentionEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: AverageEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerCrossAttendDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerFinetuningDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerPrefixDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerPretrainingDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerCrossAttendDecoder
sub_decoder_name: DiffusionDecoder

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: FeedForward

View File

@ -1,7 +1,7 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: Parallel

View File

@ -1,7 +1,7 @@
encoding_scheme: remi
num_features: 5
vocab_name: LangTokenVocab
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SingleEmbedding
main_decoder_name: XtransformerDecoder
sub_decoder_name: SingleProjection

View File

@ -1,7 +1,7 @@
encoding_scheme: remi
num_features: 7
vocab_name: LangTokenVocab
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SingleEmbedding
main_decoder_name: XtransformerDecoder
sub_decoder_name: SingleProjection

View File

@ -1,7 +1,7 @@
encoding_scheme: remi
num_features: 8
vocab_name: LangTokenVocab
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SingleEmbedding
main_decoder_name: XtransformerDecoder
sub_decoder_name: SingleProjection

View File

@ -1,7 +1,7 @@
encoding_scheme: remi
num_features: 8
vocab_name: LangTokenVocab
model_name: NestedMusicTransformer
model_name: AmadeusModel
input_embedder_name: SingleEmbedding
main_decoder_name: XtransformerDecoder
sub_decoder_name: SingleProjection

View File

@ -0,0 +1,20 @@
# 读取路径下所有的yaml文件批量替换指定的字符串
import os
import yaml
import glob
import re
# The identifier to search for and the identifier that replaces it.
old_string = 'NestedMusicTransformer'
new_string = 'AmadeusModel'
# Directory containing the YAML files to rewrite (relative to the working directory).
directory = 'Amadeus/symbolic_yamls/nn_params'


def replace_in_yaml_files(directory, old_string, new_string):
    """Replace whole-word occurrences of ``old_string`` in every ``*.yaml`` file of a directory.

    Only files directly inside ``directory`` whose name matches ``*.yaml`` are
    considered (no recursion). Each file is read as UTF-8, every occurrence of
    ``old_string`` delimited by regex word boundaries (``\\b``) is replaced by
    ``new_string``, and the file is written back only if its content changed.

    Args:
        directory: Path of the directory to scan.
        old_string: Literal text to search for (regex metacharacters are escaped).
        new_string: Literal replacement text (backslashes are NOT treated as
            regex escapes or group references).

    Returns:
        A list with the paths of the files that were actually modified, in
        sorted order.

    Raises:
        OSError: If a matched file cannot be read or written.
        UnicodeDecodeError: If a matched file is not valid UTF-8.
    """
    pattern = re.compile(r'\b' + re.escape(old_string) + r'\b')
    changed = []
    # Sort so that the processing order (and the printed log) is deterministic;
    # glob itself returns entries in arbitrary order.
    for filepath in sorted(glob.glob(os.path.join(directory, '*.yaml'))):
        # newline='' disables newline translation so that the file's original
        # line endings (LF or CRLF) survive the read/write round trip.
        with open(filepath, 'r', encoding='utf-8', newline='') as file:
            content = file.read()
        # A callable replacement inserts new_string verbatim; passing the string
        # directly would make re interpret backslashes in it as escapes.
        new_content = pattern.sub(lambda _match: new_string, content)
        # Skip the write when nothing matched, so untouched files keep their
        # modification time and are not needlessly rewritten.
        if new_content != content:
            with open(filepath, 'w', encoding='utf-8', newline='') as file:
                file.write(new_content)
            changed.append(filepath)
        print(f'Processed file: {filepath}')
    return changed


# Run the replacement with the settings above, as the script always did.
replace_in_yaml_files(directory, old_string, new_string)

View File

@ -0,0 +1,20 @@
encoding_scheme: cp
num_features: 5
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
input_length: 1024
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: True

View File

@ -0,0 +1,20 @@
encoding_scheme: cp
num_features: 5
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
input_length: 1024
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: False

View File

@ -0,0 +1,18 @@
encoding_scheme: cp
num_features: 5
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: FeedForward
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1

View File

@ -0,0 +1,19 @@
encoding_scheme: cp
num_features: 5
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: FeedForward
model_dropout: 0.1
partial_sequential_prediction: True
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1

View File

@ -0,0 +1,19 @@
encoding_scheme: cp
num_features: 7
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: True

View File

@ -0,0 +1,19 @@
encoding_scheme: cp
num_features: 7
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: False

View File

@ -0,0 +1,18 @@
encoding_scheme: cp
num_features: 7
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: FeedForward
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1

View File

@ -0,0 +1,20 @@
encoding_scheme: cp
num_features: 7
vocab_name: MusicTokenVocabCP
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: FeedForward
model_dropout: 0.1
partial_sequential_prediction: True
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
input_length: 1024
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: True

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: True

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 12
num_head: 16
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 3
feature_enricher_use: False

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 768
num_layer: 12
num_head: 16
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 3
feature_enricher_use: False

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: False

View File

@ -0,0 +1,18 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: FeedForward
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1

View File

@ -0,0 +1,18 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: Parallel
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1

View File

@ -0,0 +1,18 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: RNN
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1

View File

@ -0,0 +1,18 @@
encoding_scheme: nb
num_features: 5
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: SelfAttention
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 7
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: True

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 7
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: False

View File

@ -0,0 +1,18 @@
encoding_scheme: nb
num_features: 7
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: FeedForward
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1

View File

@ -0,0 +1,18 @@
encoding_scheme: nb
num_features: 7
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: Parallel
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1

View File

@ -0,0 +1,18 @@
encoding_scheme: nb
num_features: 7
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: RNN
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1

View File

@ -0,0 +1,18 @@
encoding_scheme: nb
num_features: 7
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: SelfAttention
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SelfAttentionEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: False

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: True

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 12
num_head: 16
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: True

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 12
num_head: 16
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 3
feature_enricher_use: True

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: CrossAttention
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 6
feature_enricher_use: True

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: False

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.2
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 768
num_layer: 16
num_head: 12
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: False

View File

@ -0,0 +1,20 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 12
num_head: 16
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: True

View File

@ -0,0 +1,20 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: AverageEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 12
num_head: 16
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: True

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 12
num_head: 16
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 3
feature_enricher_use: True

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 2
feature_enricher_use: False

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 6
feature_enricher_use: True

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerCrossAttendDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.2
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 768
num_layer: 16
num_head: 12
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: False

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerFinetuningDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.2
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 768
num_layer: 20
num_head: 12
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: False

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerPrefixDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 768
num_layer: 16
num_head: 12
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: False

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerPretrainingDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 768
num_layer: 20
num_head: 12
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: False

View File

@ -0,0 +1,19 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerCrossAttendDecoder
sub_decoder_name: DiffusionDecoder
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1
feature_enricher_use: False

View File

@ -0,0 +1,18 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: FeedForward
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1

View File

@ -0,0 +1,18 @@
encoding_scheme: nb
num_features: 8
vocab_name: MusicTokenVocabNB
model_name: NestedMusicTransformer
input_embedder_name: SummationEmbedder
main_decoder_name: XtransformerDecoder
sub_decoder_name: Parallel
model_dropout: 0.1
input_embedder:
num_layer: 1
num_head: 8
main_decoder:
dim_model: 512
num_layer: 6
num_head: 8
sub_decoder:
decout_window_size: 1 # 1 means no previous decoding output added
num_layer: 1

View File

@ -0,0 +1,12 @@
encoding_scheme: remi
num_features: 5
vocab_name: LangTokenVocab
model_name: NestedMusicTransformer
input_embedder_name: SingleEmbedding
main_decoder_name: XtransformerDecoder
sub_decoder_name: SingleProjection
model_dropout: 0.1
main_decoder:
dim_model: 512
num_layer: 8
num_head: 8

View File

@ -0,0 +1,12 @@
encoding_scheme: remi
num_features: 7
vocab_name: LangTokenVocab
model_name: NestedMusicTransformer
input_embedder_name: SingleEmbedding
main_decoder_name: XtransformerDecoder
sub_decoder_name: SingleProjection
model_dropout: 0.1
main_decoder:
dim_model: 512
num_layer: 8
num_head: 8

View File

@ -0,0 +1,12 @@
encoding_scheme: remi
num_features: 8
vocab_name: LangTokenVocab
model_name: NestedMusicTransformer
input_embedder_name: SingleEmbedding
main_decoder_name: XtransformerDecoder
sub_decoder_name: SingleProjection
model_dropout: 0.1
main_decoder:
dim_model: 512
num_layer: 8
num_head: 8

View File

@ -0,0 +1,12 @@
encoding_scheme: remi
num_features: 8
vocab_name: LangTokenVocab
model_name: NestedMusicTransformer
input_embedder_name: SingleEmbedding
main_decoder_name: XtransformerDecoder
sub_decoder_name: SingleProjection
model_dropout: 0.1
main_decoder:
dim_model: 512
num_layer: 12
num_head: 16