Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add precision classification metric #2293

Merged
merged 31 commits into from
Nov 20, 2024
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
Show all changes
31 commits
Select commit Hold shift + click to select a range
c73438f
Implement confusion matrix and precision, first draft
Aug 21, 2024
63f4a1d
Implement confusion matrix
Sep 9, 2024
b9d71b6
format :D
Sep 9, 2024
eac29aa
add agg type to cm, reformat debug representation add testing.
Sep 20, 2024
59db68b
formating and tiny refactor
Sep 21, 2024
4261bd8
add ClassificationMetric trait, rename variables and types, move test…
Sep 21, 2024
5431a2f
change unwrap to expect
Sep 21, 2024
fd2e585
update book
Sep 21, 2024
56965e8
remove unused code
Sep 22, 2024
419438a
changes to make reusing code easier
Sep 22, 2024
dfac847
format :D
Sep 22, 2024
ea4b29c
change to static data tests
Sep 24, 2024
e23aa7b
remove classification metric trait, add auxiliary code for classific…
Oct 14, 2024
60a246b
move classification objects to classification.rs, use rstest, remove …
Oct 21, 2024
c145531
review docstring, add top_k for multiclass tasks.
Oct 23, 2024
0c984c4
move class averaging and metric computation to metric implementation,…
Oct 25, 2024
b0a2939
change struct and var names
Oct 25, 2024
f18e321
Merge branch 'main' into add-to-metrics
Oct 26, 2024
386802c
rename params, enforce nonzero for top_k param, optimize one_hot for …
Oct 30, 2024
b525527
add adaptor por classification input, correct one hot function
Nov 1, 2024
ff7611a
define default for ClassReduction, derive new for Precision metric wi…
Nov 8, 2024
4cbcff2
Merge branch 'main' into add-to-metrics
Nov 8, 2024
eeab0d3
expose PrecisionMetric, change metric initialization
Nov 8, 2024
aea207f
check one_hot input tensor has more than 1 classes and correct it's i…
Nov 16, 2024
410f273
Merge branch 'main' into add-to-metrics
Nov 16, 2024
746fa9d
implement adaptor for MultilabelClassificationOutput and Classificati…
Nov 16, 2024
7428b86
change with_top_k to take usize
Nov 18, 2024
58e1902
Merge branch 'main' into add-to-metrics
Nov 18, 2024
d598f00
Add precision config for binary, multiclass and multilabel
laggui Nov 18, 2024
1542ee9
Fix dummy_classification_input
laggui Nov 18, 2024
03ebe1d
make PrecisionMetric public
Nov 19, 2024
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Prev Previous commit
Next Next commit
review docstring, add top_k for multiclass tasks.
  • Loading branch information
Tiago Sanona committed Oct 23, 2024
commit c145531803ca3c75b794a7566b7dd7ae001cebb4
2 changes: 1 addition & 1 deletion crates/burn-train/src/metric/classification.rs
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
use burn_core::prelude::{Backend, Bool, Tensor};

/// The [classification metric](ClassificationMetric) input type.
/// Input for classification tasks.
#[derive(new, Debug, Clone)]
pub struct ClassificationInput<B: Backend> {
/// Sample x Class Non thresholded normalized predictions.
Expand Down
73 changes: 63 additions & 10 deletions crates/burn-train/src/metric/confusion_stats.rs
Original file line number Diff line number Diff line change
Expand Up @@ -34,12 +34,24 @@ impl<B: Backend> ConfusionStats<B> {
/// Builds the confusion statistics from `predictions` and `targets`.
///
/// Exactly one of `threshold` and `top_k` must be `Some`:
/// - with `threshold`, every prediction greater than the threshold is marked as predicted;
/// - with `top_k`, the first `top_k` indices of the descending argsort along dimension 1
///   are marked as predicted for each row.
///
/// # Panics
///
/// Panics when `threshold` and `top_k` are both `Some` or both `None`.
pub fn new(
predictions: Tensor<B, 2>,
targets: Tensor<B, 2, Bool>,
threshold: f64,
threshold: Option<f64>,
top_k: Option<usize>,
class_average: ClassAverageType,
) -> Self {
let thresholded_predictions = predictions.greater_elem(threshold);
// The two decision rules are mutually exclusive; any other combination falls through to the panic arm.
let prediction_mask = match (threshold, top_k) {
// Threshold rule: element-wise comparison of the scores against `threshold`.
(Some(threshold), None) => {
predictions.greater_elem(threshold)
},
// Top-k rule: start from an all-zero mask and scatter ones at the positions of the
// `top_k` leading indices of the descending argsort along dimension 1.
// NOTE(review): `narrow(1, 0, top_k)` presumably requires `top_k` to be at most the
// size of dimension 1 — confirm how larger values (or 0) are handled.
(None, Some(top_k)) => {
let mask = predictions.zeros_like();
let values = predictions.ones_like().narrow(1, 0, top_k);
let indexes = predictions.argsort_descending(1).narrow(1, 0, top_k);
mask.scatter(1, indexes, values).bool()
}
_ => panic!("Either threshold (for binary or multilabel) or top_k (for multiclass) must be set."),
};
Self {
confusion_classes: thresholded_predictions.int() + targets.int() * 2,
// Each cell is encoded as prediction + 2 * target (assuming `int()` maps false/true to 0/1):
// 0 = neither, 1 = predicted only, 2 = target only, 3 = predicted and target.
confusion_classes: prediction_mask.int() + targets.int() * 2,
class_average,
}
}
Expand Down Expand Up @@ -133,6 +145,19 @@ mod tests {
use burn_core::prelude::TensorData;
use rstest::rstest;

#[rstest]
#[should_panic]
#[case::both_some(Some(THRESHOLD), Some(1))]
#[should_panic]
#[case::both_none(None, None)]
fn test_exclusive_threshold_top_k(
    #[case] threshold: Option<f64>,
    #[case] top_k: Option<usize>,
) {
    // Both cases hand `ConfusionStats::new` an invalid threshold/top_k pairing
    // (both set, or neither set); the constructor is expected to panic.
    let input = dummy_classification_input(&Binary);
    let (predictions, targets) = input.into();
    let _stats = ConfusionStats::new(predictions, targets, threshold, top_k, Micro);
}

#[rstest]
#[case::binary_micro(Binary, Micro, [1].into())]
#[case::binary_macro(Binary, Macro, [1].into())]
Expand All @@ -146,7 +171,11 @@ mod tests {
#[case] expected: Vec<i64>,
) {
let (predictions, targets) = dummy_classification_input(&class_type).into();
ConfusionStats::new(predictions, targets, THRESHOLD, avg_type)
let (threshold, top_k) = match class_type {
Multiclass => (None, Some(1)),
_ => (Some(THRESHOLD), None),
};
ConfusionStats::new(predictions, targets, threshold, top_k, avg_type)
.true_positive()
.int()
.into_data()
Expand All @@ -166,7 +195,11 @@ mod tests {
#[case] expected: Vec<i64>,
) {
let (predictions, targets) = dummy_classification_input(&class_type).into();
ConfusionStats::new(predictions, targets, THRESHOLD, avg_type)
let (threshold, top_k) = match class_type {
Multiclass => (None, Some(1)),
_ => (Some(THRESHOLD), None),
};
ConfusionStats::new(predictions, targets, threshold, top_k, avg_type)
.true_negative()
.int()
.into_data()
Expand All @@ -186,7 +219,11 @@ mod tests {
#[case] expected: Vec<i64>,
) {
let (predictions, targets) = dummy_classification_input(&class_type).into();
ConfusionStats::new(predictions, targets, THRESHOLD, avg_type)
let (threshold, top_k) = match class_type {
Multiclass => (None, Some(1)),
_ => (Some(THRESHOLD), None),
};
ConfusionStats::new(predictions, targets, threshold, top_k, avg_type)
.false_positive()
.int()
.into_data()
Expand All @@ -206,7 +243,11 @@ mod tests {
#[case] expected: Vec<i64>,
) {
let (predictions, targets) = dummy_classification_input(&class_type).into();
ConfusionStats::new(predictions, targets, THRESHOLD, avg_type)
let (threshold, top_k) = match class_type {
Multiclass => (None, Some(1)),
_ => (Some(THRESHOLD), None),
};
ConfusionStats::new(predictions, targets, threshold, top_k, avg_type)
.false_negative()
.int()
.into_data()
Expand All @@ -226,7 +267,11 @@ mod tests {
#[case] expected: Vec<i64>,
) {
let (predictions, targets) = dummy_classification_input(&class_type).into();
ConfusionStats::new(predictions, targets, THRESHOLD, avg_type)
let (threshold, top_k) = match class_type {
Multiclass => (None, Some(1)),
_ => (Some(THRESHOLD), None),
};
ConfusionStats::new(predictions, targets, threshold, top_k, avg_type)
.positive()
.int()
.into_data()
Expand All @@ -246,7 +291,11 @@ mod tests {
#[case] expected: Vec<i64>,
) {
let (predictions, targets) = dummy_classification_input(&class_type).into();
ConfusionStats::new(predictions, targets, THRESHOLD, avg_type)
let (threshold, top_k) = match class_type {
Multiclass => (None, Some(1)),
_ => (Some(THRESHOLD), None),
};
ConfusionStats::new(predictions, targets, threshold, top_k, avg_type)
.negative()
.int()
.into_data()
Expand All @@ -266,7 +315,11 @@ mod tests {
#[case] expected: Vec<i64>,
) {
let (predictions, targets) = dummy_classification_input(&class_type).into();
ConfusionStats::new(predictions, targets, THRESHOLD, avg_type)
let (threshold, top_k) = match class_type {
Multiclass => (None, Some(1)),
_ => (Some(THRESHOLD), None),
};
ConfusionStats::new(predictions, targets, threshold, top_k, avg_type)
.predicted_positive()
.int()
.into_data()
Expand Down
36 changes: 28 additions & 8 deletions crates/burn-train/src/metric/precision.rs
Original file line number Diff line number Diff line change
Expand Up @@ -11,14 +11,17 @@ use core::marker::PhantomData;
pub struct PrecisionMetric<B: Backend> {
state: NumericMetricState,
_b: PhantomData<B>,
threshold: f64,
threshold: Option<f64>,
class_average: ClassAverageType,
top_k: Option<usize>,
}

#[allow(dead_code)]
impl<B: Backend> PrecisionMetric<B> {
/// Sets the decision threshold and clears any configured top-k.
///
/// After this call `threshold` is `Some(threshold)` and `top_k` is `None`, so the
/// metric carries exactly one of the two settings.
pub fn with_threshold(mut self, threshold: f64) -> Self {
self.threshold = threshold;
self.threshold = Some(threshold);
self.top_k = None;
self
}

Expand All @@ -27,6 +30,13 @@ impl<B: Backend> PrecisionMetric<B> {
self.class_average = class_average;
self
}

/// Sets the top k.
pub fn with_top_k(mut self, top_k: usize) -> Self {
self.top_k = Some(top_k);
self.threshold = None;
self
}
}

impl<B: Backend> Default for PrecisionMetric<B> {
Expand All @@ -35,8 +45,9 @@ impl<B: Backend> Default for PrecisionMetric<B> {
Self {
state: NumericMetricState::default(),
_b: PhantomData,
threshold: 0.5,
threshold: Some(0.5),
class_average: ClassAverageType::Micro,
top_k: None,
}
}
}
Expand All @@ -51,8 +62,14 @@ impl<B: Backend> Metric for PrecisionMetric<B> {
) -> MetricEntry {
let (predictions, targets) = input.clone().into();
let [sample_size, _] = input.predictions.dims();
let metric = ConfusionStats::new(predictions, targets, self.threshold, self.class_average)
.precision();
let metric = ConfusionStats::new(
predictions,
targets,
self.threshold,
self.top_k,
self.class_average,
)
.precision();

self.state.update(
100.0 * metric,
Expand Down Expand Up @@ -100,9 +117,12 @@ mod tests {
#[case] expected: f64,
) {
let input = dummy_classification_input(&class_type);
let mut metric = PrecisionMetric::<TestBackend>::default()
.with_threshold(THRESHOLD)
.with_class_average(avg_type);
let mut metric = PrecisionMetric::<TestBackend>::default();
metric = match class_type {
Multiclass => metric.with_top_k(1),
laggui marked this conversation as resolved.
Show resolved Hide resolved
_ => metric.with_threshold(THRESHOLD),
};
metric = metric.with_class_average(avg_type);
let _entry = metric.update(&input, &MetricMetadata::fake());
TensorData::from([metric.value()])
.assert_approx_eq(&TensorData::from([expected * 100.0]), 3)
Expand Down