Compare commits

..

No commits in common. "feeccf733cf46b124f7399ac93e53b27386a3ae6" and "d7fe504e1ec69ad5ad9a49237d62efff0bf8c93b" have entirely different histories.

2 changed files with 3 additions and 3 deletions

View File

@@ -627,7 +627,7 @@ class MiniMindLM(PreTrainedModel):
# Specific layers for v path # Specific layers for v path
self.downsample_v_specific = nn.Sequential( self.downsample_v_specific = nn.Sequential(
nn.Conv1d(128*8, 128, kernel_size=1, padding='same'), nn.Conv1d(128*8, 128, kernel_size=1, padding='same'),
nn.Conv1d(128, self.params.knowledge_length, kernel_size=1, padding='same') nn.Conv1d(128, 8, kernel_size=1, padding='same')
) )
# Specific layers for q path # Specific layers for q path

View File

@@ -46,5 +46,5 @@ CUDA_VISIBLE_DEVICES=0,1,2,3 accelerate launch \
--use_flash_attn \ --use_flash_attn \
--profile \ --profile \
--profile_interval 10\ --profile_interval 10\
--knowledge_num 16384 \ --knowlwdge_num 1024 \
--knowledge_length 64 --knowlwdge_length 8