@@ -58,49 +58,6 @@ class LoraConfig:
5858 bias = "none"
5959 lora_dropout : float = 0.05
6060
@dataclass
class aLoraConfig:
    """Configuration for an Activated LoRA [`aLoraModel`].

    Args:
        r (`int`):
            Lora attention dimension (the "rank").
        lora_alpha (`int`):
            The alpha parameter for Lora scaling.
        target_modules (`List[str]`):
            The names of the modules to apply the adapter to. If this is
            specified, only the modules with the specified names will be
            replaced. Please specify modules as per model architecture.
            If the value is ["all-linear"], then LORA selects all linear and
            Conv1D modules as per model architecture, except for the output
            layer.
        lora_dropout (`float`):
            The dropout probability for Lora layers.
        activation_prompt (`str`):
            String which indicates the start of the aLoRA generation.
        bias (`str`):
            Bias type for LoRA. Can be 'none', 'all' or 'lora_only'.
            If 'all' or 'lora_only', the corresponding biases will be updated
            during training. Be aware that this means that, even when
            disabling the adapters, the model will not produce the same
            output as the base model would have without adaptation.
    """

    r: int = 8
    lora_alpha: int = 32
    target_modules: List[str] = field(
        default=None,
        metadata={
            # Built with implicit concatenation only: a backslash-newline
            # inside a string literal would embed the next line's indentation
            # in the help text.
            "help": (
                "The names of the modules to apply LORA to. "
                "LORA selects modules which either completely match or "
                'end with one of the strings. If the value is ["all-linear"], '
                "then LORA selects all linear and Conv1D "
                "modules except for the output layer."
            )
        },
    )
    lora_dropout: float = 0.05
    activation_prompt: str = None
    # Annotated so that `bias` is a real dataclass field (an unannotated
    # assignment is only a class attribute and is ignored by __init__,
    # fields() and asdict()). Declared last so the positional order of the
    # pre-existing constructor arguments stays unchanged.
    bias: str = "none"
10461
10562
10663@dataclass
0 commit comments