Skip to content

Commit

Permalink
Update utils.py
Browse files Browse the repository at this point in the history
  • Loading branch information
AakritiKinra authored Jan 10, 2025
1 parent be9518b commit 01556de
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion llments/eval/factscore/utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -72,7 +72,7 @@ def _replace_linear_with_int8linear(model: nn.Module, modules_to_not_convert: st
model._modules[name] = QuantizedLinearInt8(linear_layer=module)
return

class QuantizedLinearInt8(Module):
class QuantizedLinearInt8(Module): # type: ignore
"""A simple but effective implementation of Int8 quantization for linear layers.
The weights are quantized and stored as Int8, which saves ~50% of the gpu memory.
Expand Down

0 comments on commit 01556de

Please sign in to comment.