Compare commits
No commits in common. "feeccf733cf46b124f7399ac93e53b27386a3ae6" and "d7fe504e1ec69ad5ad9a49237d62efff0bf8c93b" have entirely different histories.
feeccf733c
...
d7fe504e1e
@ -627,7 +627,7 @@ class MiniMindLM(PreTrainedModel):
|
||||
# Specific layers for v path
|
||||
self.downsample_v_specific = nn.Sequential(
|
||||
nn.Conv1d(128*8, 128, kernel_size=1, padding='same'),
|
||||
nn.Conv1d(128, self.params.knowledge_length, kernel_size=1, padding='same')
|
||||
nn.Conv1d(128, 8, kernel_size=1, padding='same')
|
||||
)
|
||||
|
||||
# Specific layers for q path
|
||||
|
@ -46,5 +46,5 @@ CUDA_VISIBLE_DEVICES=0,1,2,3 accelerate launch \
|
||||
--use_flash_attn \
|
||||
--profile \
|
||||
--profile_interval 10\
|
||||
--knowledge_num 16384 \
|
||||
--knowledge_length 64
|
||||
--knowlwdge_num 1024 \
|
||||
--knowlwdge_length 8
|
||||
|
Loading…
x
Reference in New Issue
Block a user