
Conversation

nicklamiller (Contributor)

Contributes to: #6983

  • Adds R-squared to regression metrics as R2Metric
    • Since this metric measures goodness of fit, i.e. higher is better, I made it a subclass of Metric instead of a subclass of RegressionMetric (like the other regression metrics, which measure loss/error), and used a very similar approach to how AveragePrecisionMetric is defined in binary_metric.hpp (a hedged sketch of how the same pattern could look for R² is included after this list):
```cpp
class AveragePrecisionMetric: public Metric {
 public:
  explicit AveragePrecisionMetric(const Config&) {
  }

  virtual ~AveragePrecisionMetric() {
  }

  const std::vector<std::string>& GetName() const override {
    return name_;
  }

  double factor_to_bigger_better() const override {
    return 1.0f;
  }

  void Init(const Metadata& metadata, data_size_t num_data) override {
    name_.emplace_back("average_precision");
    num_data_ = num_data;
    // get label
    label_ = metadata.label();
    // get weights
    weights_ = metadata.weights();
    if (weights_ == nullptr) {
      sum_weights_ = static_cast<double>(num_data_);
    } else {
      sum_weights_ = 0.0f;
      for (data_size_t i = 0; i < num_data; ++i) {
        sum_weights_ += weights_[i];
      }
    }
  }

  std::vector<double> Eval(const double* score, const ObjectiveFunction*) const override {
    // get indices sorted by score, descending order
    std::vector<data_size_t> sorted_idx;
    for (data_size_t i = 0; i < num_data_; ++i) {
      sorted_idx.emplace_back(i);
    }
    Common::ParallelSort(sorted_idx.begin(), sorted_idx.end(), [score](data_size_t a, data_size_t b) { return score[a] > score[b]; });
    // temp sum of positive label
    double cur_actual_pos = 0.0f;
    // total sum of positive label
    double sum_actual_pos = 0.0f;
    // total sum of predicted positive
    double sum_pred_pos = 0.0f;
    // accumulated precision
    double accum_prec = 1.0f;
    // accumulated pr-auc
    double accum = 0.0f;
    // temp sum of negative label
    double cur_neg = 0.0f;
    double threshold = score[sorted_idx[0]];
    if (weights_ == nullptr) {  // no weights
      for (data_size_t i = 0; i < num_data_; ++i) {
        const label_t cur_label = label_[sorted_idx[i]];
        const double cur_score = score[sorted_idx[i]];
        // new threshold
        if (cur_score != threshold) {
          threshold = cur_score;
          // accumulate
          sum_actual_pos += cur_actual_pos;
          sum_pred_pos += cur_actual_pos + cur_neg;
          accum_prec = sum_actual_pos / sum_pred_pos;
          accum += cur_actual_pos * accum_prec;
          // reset
          cur_neg = cur_actual_pos = 0.0f;
        }
        cur_neg += (cur_label <= 0);
        cur_actual_pos += (cur_label > 0);
      }
    } else {  // has weights
      for (data_size_t i = 0; i < num_data_; ++i) {
        const label_t cur_label = label_[sorted_idx[i]];
        const double cur_score = score[sorted_idx[i]];
        const label_t cur_weight = weights_[sorted_idx[i]];
        // new threshold
        if (cur_score != threshold) {
          threshold = cur_score;
          // accumulate
          sum_actual_pos += cur_actual_pos;
          sum_pred_pos += cur_actual_pos + cur_neg;
          accum_prec = sum_actual_pos / sum_pred_pos;
          accum += cur_actual_pos * accum_prec;
          // reset
          cur_neg = cur_actual_pos = 0.0f;
        }
        cur_neg += (cur_label <= 0) * cur_weight;
        cur_actual_pos += (cur_label > 0) * cur_weight;
      }
    }
    sum_actual_pos += cur_actual_pos;
    sum_pred_pos += cur_actual_pos + cur_neg;
    accum_prec = sum_actual_pos / sum_pred_pos;
    accum += cur_actual_pos * accum_prec;
    double ap = 1.0f;
    if (sum_actual_pos > 0.0f && sum_actual_pos != sum_weights_) {
      ap = accum / sum_actual_pos;
    }
    return std::vector<double>(1, ap);
  }

 private:
  /*! \brief Number of data */
  data_size_t num_data_;
  /*! \brief Pointer of label */
  const label_t* label_;
  /*! \brief Pointer of weighs */
  const label_t* weights_;
  /*! \brief Sum weights */
  double sum_weights_;
  /*! \brief Name of test set */
  std::vector<std::string> name_;
};
```

  • For this PR I decided to skip the CUDA implementation, but plan to follow up with that after this gets merged, as part of Built-in R2 (R-squared) metric #6983.
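
For reference, here is a rough sketch of how a higher-is-better R² metric could look when it follows the Metric interface shown above. This is not the code from this PR: the Init/Eval bodies, the "r2" name string, the headers, and the weight handling are illustrative assumptions (the actual implementation may also convert raw scores through the objective and handle edge cases differently); only the names R2Metric, sum_weights_, and total_sum_squares_ come from the discussion in this PR.

```cpp
// Hypothetical sketch only; assumes LightGBM's Metric interface as in the
// AveragePrecisionMetric excerpt above.
#include <LightGBM/metric.h>

#include <string>
#include <vector>

namespace LightGBM {

class R2Metric : public Metric {
 public:
  explicit R2Metric(const Config&) {}
  virtual ~R2Metric() {}

  const std::vector<std::string>& GetName() const override { return name_; }

  // R^2 measures goodness of fit, so higher is better.
  double factor_to_bigger_better() const override { return 1.0f; }

  void Init(const Metadata& metadata, data_size_t num_data) override {
    name_.emplace_back("r2");  // illustrative alias; the PR's alias may differ
    num_data_ = num_data;
    label_ = metadata.label();
    weights_ = metadata.weights();
    // Weighted label mean, then the total (weighted) sum of squares SS_tot.
    double sum_weights = 0.0, sum_label = 0.0;
    for (data_size_t i = 0; i < num_data_; ++i) {
      const double w = (weights_ == nullptr) ? 1.0 : weights_[i];
      sum_weights += w;
      sum_label += w * label_[i];
    }
    sum_weights_ = sum_weights;
    const double label_mean = sum_label / sum_weights_;
    double total_sum_squares = 0.0;
    for (data_size_t i = 0; i < num_data_; ++i) {
      const double w = (weights_ == nullptr) ? 1.0 : weights_[i];
      const double diff = label_[i] - label_mean;
      total_sum_squares += w * diff * diff;
    }
    total_sum_squares_ = total_sum_squares;
  }

  std::vector<double> Eval(const double* score, const ObjectiveFunction*) const override {
    // R^2 = 1 - SS_res / SS_tot
    double residual_sum_squares = 0.0;
    for (data_size_t i = 0; i < num_data_; ++i) {
      const double w = (weights_ == nullptr) ? 1.0 : weights_[i];
      const double diff = label_[i] - score[i];
      residual_sum_squares += w * diff * diff;
    }
    if (total_sum_squares_ <= 0.0) {
      // Constant label: R^2 is undefined; the actual PR may handle this differently.
      return std::vector<double>(1, 0.0);
    }
    return std::vector<double>(1, 1.0 - residual_sum_squares / total_sum_squares_);
  }

 private:
  data_size_t num_data_;
  const label_t* label_;
  const label_t* weights_;
  double sum_weights_;
  double total_sum_squares_;
  std::vector<std::string> name_;
};

}  // namespace LightGBM
```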

@nicklamiller nicklamiller marked this pull request as ready for review August 25, 2025 03:42

```cpp
double local_sum_weights = 0.0f;
#pragma omp parallel for num_threads(OMP_NUM_THREADS()) schedule(static) reduction(+:local_sum_weights, sum_label)
for (data_size_t i = 0; i < num_data_; ++i) {
  local_sum_weights += weights_[i];
```
nicklamiller (Contributor Author)

Just wanted to give a heads-up: I originally updated the sum_weights_ data member directly in this for-loop, but that resulted in CI failures on some of the R-package jobs for several builds on Windows, with the following error (workflow run, line with specific error):

... error C3028: 'LightGBM::R2Metric::sum_weights_': only a variable or static data member can be used in a data-sharing clause ...

So now the local_sum_weights variable is used in the pragma's reduction clause and updated in the loop, and then assigned to sum_weights_ below. I also had to do this for the total_sum_squares_ member by introducing a local_total_sum_squares variable.
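
A minimal sketch of that pattern, for context: the reduction accumulates into function-local variables that are assigned to the data members afterwards, because MSVC's OpenMP rejects non-static data members in data-sharing clauses (error C3028). The variable and member names mirror the diff excerpt above; the loop body beyond local_sum_weights and the surrounding declarations are illustrative assumptions, and this branch assumes weights_ is non-null.

```cpp
// Would fail to compile on MSVC:
//   #pragma omp parallel for reduction(+:sum_weights_)   // error C3028
double local_sum_weights = 0.0f;
double sum_label = 0.0f;
#pragma omp parallel for num_threads(OMP_NUM_THREADS()) schedule(static) reduction(+:local_sum_weights, sum_label)
for (data_size_t i = 0; i < num_data_; ++i) {
  local_sum_weights += weights_[i];
  sum_label += weights_[i] * label_[i];  // illustrative: weighted label sum
}
sum_weights_ = local_sum_weights;  // reduced value copied into the data member
```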

Collaborator

Thanks for the explanation, makes sense to me! I can't think of a better way to do this, I think this small allocation is totally fine.

@jameslamb (Collaborator) left a comment

blegh, I thought I submitted a review yesterday but I guess I forgot to click "submit review"!

Thank you so much for this excellent PR! It's rare that I review a PR this large and have 0 comments... but I have 0 comments. You addressed everything I would have asked for... followed the project's style, added lightweight but also very effective tests, updated the docs and that list in the R package.

This is just an awesome PR, and I'm excited to add this to LightGBM. Thanks for your hard work!

@jameslamb (Collaborator)

I'm not that familiar with C++, so let's see if we can get one other reviewer to look... @borchero could you help us with a review here?

@jameslamb (Collaborator)

/gha run r-valgrind

@jameslamb (Collaborator) left a comment

I'd been hoping for another reviewer, but it looks like no one is available, and I'd been waiting to see valgrind results, but I realize we don't need those because this PR isn't adding R-package tests anyway.

I'm confident enough in my ability to review these changes that I think we should just merge this.

On a re-review I left one more small suggestion. I'm going to just apply that and then merge this if/when CI passes.

Thanks again for the excellent contribution!

@jameslamb (Collaborator)

I think the "Optional checks" workflow is going to fail (like this) until we get a successful run of the valgrind workflow on this branch, because I put up #7008 (comment) but the job wasn't triggered, for the reasons described in #7012.

Sorry @nicklamiller, hopefully we'll be able to get #7035 or something similar merged soon and then re-run that workflow.

@StrikerRUS (Collaborator) left a comment

Thanks a lot for this contribution!
I have only two minor comments below:

@StrikerRUS (Collaborator) left a comment

@nicklamiller Thanks for your latest commit! I don't have any new comments.

@StrikerRUS (Collaborator)

Hmm... the errors in the CI jobs look very strange and unrelated to the PR. However, we don't have these errors in the master branch.

@nicklamiller Could you please take a look?

@StrikerRUS (Collaborator)

@nicklamiller So it looks like y = y.copy() is the cause of strange unrelated CI errors, right?..

@nicklamiller (Contributor Author)

> So it looks like y = y.copy() is the cause of strange unrelated CI errors, right?..

@StrikerRUS Removing y = y.copy() was the issue. I should've posted my response in this main thread, but please see my comment above for more details.

I've added y = y.copy() back in e5b5868, and the seemingly unrelated tests that were failing now pass. The most recent CI run still fails with a new failure, though that appears to be an unrelated, flaky (API-rate-limit-related) failure:

```text
urllib.error.HTTPError: HTTP Error 403: rate limit exceeded
The last reported status from workflow "R valgrind tests" is failure. Commit fixes and rerun the workflow.
```

Since the most recent failure appears to be flaky, I've merged in the master branch and pushed, so hopefully CI passes this time 🤞

@jameslamb (Collaborator)

That optional-checks failure isn't "flaky". I tried to trigger an optional workflow at #7008 (comment) but then saw it fail with the issues described in #7012.

I've put up #7035 attempting to fix that (and making it easier to fix such things in the future).

@jameslamb (Collaborator)

> I've put up #7035 attempting to fix that (and making it easier to fix such things in the future).

@StrikerRUS if the latest changes here look ok to you, I'd be ok with you (temporarily!) changing the branch protection to allow merging this PR while optional-checks is failing. That way this PR doesn't need to be blocked by #7035.

@StrikerRUS (Collaborator) commented Oct 13, 2025

@nicklamiller Oh, sorry, I missed your perfect description in the resolved thread of why the unrelated tests were failing! Thanks a lot for the investigation and the fix!

@jameslamb

> changing the branch protection to allow merging this PR

Sure, totally fine!

@StrikerRUS (Collaborator)

Close-reopen to fix license/cla status.

@StrikerRUS StrikerRUS closed this Oct 13, 2025
@StrikerRUS StrikerRUS reopened this Oct 13, 2025
@StrikerRUS StrikerRUS merged commit 6f0d7cc into microsoft:master Oct 13, 2025
96 of 108 checks passed
@nicklamiller nicklamiller deleted the add-r2-metric branch October 15, 2025 17:49