@@ -361,9 +361,7 @@ <h2>LoRA Embedding Layer</h2>
361
361
</ div >
362
362
< div class ='code '>
363
363
< div class ="highlight "> < pre > < span class ="lineno "> 123</ span > < span class ="k "> if</ span > < span class ="n "> alpha</ span > < span class ="ow "> is</ span > < span class ="kc "> None</ span > < span class ="p "> :</ span >
364
- < span class ="lineno "> 124</ span > < span class ="n "> alpha</ span > < span class ="o "> =</ span > < span class ="n "> r</ span >
365
- < span class ="lineno "> 125</ span >
366
- < span class ="lineno "> 126</ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> Embedding</ span > </ pre > </ div >
364
+ < span class ="lineno "> 124</ span > < span class ="n "> alpha</ span > < span class ="o "> =</ span > < span class ="n "> r</ span > </ pre > </ div >
367
365
</ div >
368
366
</ div >
369
367
< div class ='section ' id ='section-22 '>
@@ -375,8 +373,8 @@ <h2>LoRA Embedding Layer</h2>
375
373
376
374
</ div >
377
375
< div class ='code '>
378
- < div class ="highlight "> < pre > < span class ="lineno "> 128 </ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> weight</ span > < span class ="o "> =</ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> Parameter</ span > < span class ="p "> (</ span > < span class ="n "> torch</ span > < span class ="o "> .</ span > < span class ="n "> empty</ span > < span class ="p "> ((</ span > < span class ="n "> num_embeddings</ span > < span class ="p "> ,</ span > < span class ="n "> embedding_dim</ span > < span class ="p "> )))</ span >
379
- < span class ="lineno "> 129 </ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> weight</ span > < span class ="o "> .</ span > < span class ="n "> requires_grad</ span > < span class ="o "> =</ span > < span class ="kc "> False</ span > </ pre > </ div >
376
+ < div class ="highlight "> < pre > < span class ="lineno "> 127 </ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> weight</ span > < span class ="o "> =</ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> Parameter</ span > < span class ="p "> (</ span > < span class ="n "> torch</ span > < span class ="o "> .</ span > < span class ="n "> empty</ span > < span class ="p "> ((</ span > < span class ="n "> num_embeddings</ span > < span class ="p "> ,</ span > < span class ="n "> embedding_dim</ span > < span class ="p "> )))</ span >
377
+ < span class ="lineno "> 128 </ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> weight</ span > < span class ="o "> .</ span > < span class ="n "> requires_grad</ span > < span class ="o "> =</ span > < span class ="kc "> False</ span > </ pre > </ div >
380
378
</ div >
381
379
</ div >
382
380
< div class ='section ' id ='section-23 '>
@@ -388,7 +386,7 @@ <h2>LoRA Embedding Layer</h2>
388
386
389
387
</ div >
390
388
< div class ='code '>
391
- < div class ="highlight "> < pre > < span class ="lineno "> 132 </ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> scaling</ span > < span class ="o "> =</ span > < span class ="n "> alpha</ span > < span class ="o "> /</ span > < span class ="n "> r</ span > </ pre > </ div >
389
+ < div class ="highlight "> < pre > < span class ="lineno "> 131 </ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> scaling</ span > < span class ="o "> =</ span > < span class ="n "> alpha</ span > < span class ="o "> /</ span > < span class ="n "> r</ span > </ pre > </ div >
392
390
</ div >
393
391
</ div >
394
392
< div class ='section ' id ='section-24 '>
@@ -400,7 +398,7 @@ <h2>LoRA Embedding Layer</h2>
400
398
401
399
</ div >
402
400
< div class ='code '>
403
- < div class ="highlight "> < pre > < span class ="lineno "> 134 </ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> lora_a</ span > < span class ="o "> =</ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> Parameter</ span > < span class ="p "> (</ span > < span class ="n "> torch</ span > < span class ="o "> .</ span > < span class ="n "> empty</ span > < span class ="p "> ((</ span > < span class ="n "> r</ span > < span class ="p "> ,</ span > < span class ="n "> num_embeddings</ span > < span class ="p "> )))</ span > </ pre > </ div >
401
+ < div class ="highlight "> < pre > < span class ="lineno "> 133 </ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> lora_a</ span > < span class ="o "> =</ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> Parameter</ span > < span class ="p "> (</ span > < span class ="n "> torch</ span > < span class ="o "> .</ span > < span class ="n "> empty</ span > < span class ="p "> ((</ span > < span class ="n "> r</ span > < span class ="p "> ,</ span > < span class ="n "> num_embeddings</ span > < span class ="p "> )))</ span > </ pre > </ div >
404
402
</ div >
405
403
</ div >
406
404
< div class ='section ' id ='section-25 '>
@@ -412,9 +410,9 @@ <h2>LoRA Embedding Layer</h2>
412
410
413
411
</ div >
414
412
< div class ='code '>
415
- < div class ="highlight "> < pre > < span class ="lineno "> 136 </ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> lora_b</ span > < span class ="o "> =</ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> Parameter</ span > < span class ="p "> (</ span > < span class ="n "> torch</ span > < span class ="o "> .</ span > < span class ="n "> empty</ span > < span class ="p "> ((</ span > < span class ="n "> embedding_dim</ span > < span class ="p "> ,</ span > < span class ="n "> r</ span > < span class ="p "> )))</ span >
416
- < span class ="lineno "> 137 </ span >
417
- < span class ="lineno "> 138 </ span > < span class ="k "> with</ span > < span class ="n "> torch</ span > < span class ="o "> .</ span > < span class ="n "> no_grad</ span > < span class ="p "> ():</ span > </ pre > </ div >
413
+ < div class ="highlight "> < pre > < span class ="lineno "> 135 </ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> lora_b</ span > < span class ="o "> =</ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> Parameter</ span > < span class ="p "> (</ span > < span class ="n "> torch</ span > < span class ="o "> .</ span > < span class ="n "> empty</ span > < span class ="p "> ((</ span > < span class ="n "> embedding_dim</ span > < span class ="p "> ,</ span > < span class ="n "> r</ span > < span class ="p "> )))</ span >
414
+ < span class ="lineno "> 136 </ span >
415
+ < span class ="lineno "> 137 </ span > < span class ="k "> with</ span > < span class ="n "> torch</ span > < span class ="o "> .</ span > < span class ="n "> no_grad</ span > < span class ="p "> ():</ span > </ pre > </ div >
418
416
</ div >
419
417
</ div >
420
418
< div class ='section ' id ='section-26 '>
@@ -426,7 +424,7 @@ <h2>LoRA Embedding Layer</h2>
426
424
427
425
</ div >
428
426
< div class ='code '>
429
- < div class ="highlight "> < pre > < span class ="lineno "> 140 </ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> init</ span > < span class ="o "> .</ span > < span class ="n "> normal_</ span > < span class ="p "> (</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> lora_a</ span > < span class ="p "> )</ span > </ pre > </ div >
427
+ < div class ="highlight "> < pre > < span class ="lineno "> 139 </ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> init</ span > < span class ="o "> .</ span > < span class ="n "> normal_</ span > < span class ="p "> (</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> lora_a</ span > < span class ="p "> )</ span > </ pre > </ div >
430
428
</ div >
431
429
</ div >
432
430
< div class ='section ' id ='section-27 '>
@@ -438,7 +436,7 @@ <h2>LoRA Embedding Layer</h2>
438
436
439
437
</ div >
440
438
< div class ='code '>
441
- < div class ="highlight "> < pre > < span class ="lineno "> 142 </ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> init</ span > < span class ="o "> .</ span > < span class ="n "> zeros_</ span > < span class ="p "> (</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> lora_b</ span > < span class ="p "> )</ span > </ pre > </ div >
439
+ < div class ="highlight "> < pre > < span class ="lineno "> 141 </ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> init</ span > < span class ="o "> .</ span > < span class ="n "> zeros_</ span > < span class ="p "> (</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> lora_b</ span > < span class ="p "> )</ span > </ pre > </ div >
442
440
</ div >
443
441
</ div >
444
442
< div class ='section ' id ='section-28 '>
@@ -449,7 +447,7 @@ <h2>LoRA Embedding Layer</h2>
449
447
450
448
</ div >
451
449
< div class ='code '>
452
- < div class ="highlight "> < pre > < span class ="lineno "> 144 </ span > < span class ="k "> def</ span > < span class ="nf "> forward</ span > < span class ="p "> (</ span > < span class ="bp "> self</ span > < span class ="p "> ,</ span > < span class ="n "> x</ span > < span class ="p "> :</ span > < span class ="n "> torch</ span > < span class ="o "> .</ span > < span class ="n "> Tensor</ span > < span class ="p "> ):</ span > </ pre > </ div >
450
+ < div class ="highlight "> < pre > < span class ="lineno "> 143 </ span > < span class ="k "> def</ span > < span class ="nf "> forward</ span > < span class ="p "> (</ span > < span class ="bp "> self</ span > < span class ="p "> ,</ span > < span class ="n "> x</ span > < span class ="p "> :</ span > < span class ="n "> torch</ span > < span class ="o "> .</ span > < span class ="n "> Tensor</ span > < span class ="p "> ):</ span > </ pre > </ div >
453
451
</ div >
454
452
</ div >
455
453
< div class ='section ' id ='section-29 '>
@@ -461,7 +459,7 @@ <h2>LoRA Embedding Layer</h2>
461
459
462
460
</ div >
463
461
< div class ='code '>
464
- < div class ="highlight "> < pre > < span class ="lineno "> 146 </ span > < span class ="n "> result</ span > < span class ="o "> =</ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> functional</ span > < span class ="o "> .</ span > < span class ="n "> embedding</ span > < span class ="p "> (</ span > < span class ="n "> x</ span > < span class ="p "> ,</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> weight</ span > < span class ="p "> )</ span > </ pre > </ div >
462
+ < div class ="highlight "> < pre > < span class ="lineno "> 145 </ span > < span class ="n "> result</ span > < span class ="o "> =</ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> functional</ span > < span class ="o "> .</ span > < span class ="n "> embedding</ span > < span class ="p "> (</ span > < span class ="n "> x</ span > < span class ="p "> ,</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> weight</ span > < span class ="p "> )</ span > </ pre > </ div >
465
463
</ div >
466
464
</ div >
467
465
< div class ='section ' id ='section-30 '>
@@ -473,7 +471,7 @@ <h2>LoRA Embedding Layer</h2>
473
471
474
472
</ div >
475
473
< div class ='code '>
476
- < div class ="highlight "> < pre > < span class ="lineno "> 149 </ span > < span class ="n "> result</ span > < span class ="o "> +=</ span > < span class ="p "> (</ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> functional</ span > < span class ="o "> .</ span > < span class ="n "> embedding</ span > < span class ="p "> (</ span > < span class ="n "> x</ span > < span class ="p "> ,</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> lora_a</ span > < span class ="o "> .</ span > < span class ="n "> T</ span > < span class ="p "> )</ span > < span class ="o "> @</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> lora_b</ span > < span class ="o "> .</ span > < span class ="n "> T</ span > < span class ="p "> )</ span > < span class ="o "> *</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> scaling</ span > </ pre > </ div >
474
+ < div class ="highlight "> < pre > < span class ="lineno "> 148 </ span > < span class ="n "> result</ span > < span class ="o "> +=</ span > < span class ="p "> (</ span > < span class ="n "> nn</ span > < span class ="o "> .</ span > < span class ="n "> functional</ span > < span class ="o "> .</ span > < span class ="n "> embedding</ span > < span class ="p "> (</ span > < span class ="n "> x</ span > < span class ="p "> ,</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> lora_a</ span > < span class ="o "> .</ span > < span class ="n "> T</ span > < span class ="p "> )</ span > < span class ="o "> @</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> lora_b</ span > < span class ="o "> .</ span > < span class ="n "> T</ span > < span class ="p "> )</ span > < span class ="o "> *</ span > < span class ="bp "> self</ span > < span class ="o "> .</ span > < span class ="n "> scaling</ span > </ pre > </ div >
477
475
</ div >
478
476
</ div >
479
477
< div class ='section ' id ='section-31 '>
@@ -485,7 +483,7 @@ <h2>LoRA Embedding Layer</h2>
485
483
486
484
</ div >
487
485
< div class ='code '>
488
- < div class ="highlight "> < pre > < span class ="lineno "> 152 </ span > < span class ="k "> return</ span > < span class ="n "> result</ span > </ pre > </ div >
486
+ < div class ="highlight "> < pre > < span class ="lineno "> 151 </ span > < span class ="k "> return</ span > < span class ="n "> result</ span > </ pre > </ div >
489
487
</ div >
490
488
</ div >
491
489
< div class ='footer '>
0 commit comments