@@ -169,7 +169,7 @@ class Distances(CustomBaseModel):
169
169
an optimal sensitivity of this privacy assessment it is recommended to use a 50/50 split between training and
170
170
holdout data, and then generate synthetic data of the same size.
171
171
172
- The embeddings of these samples are then computed, and the L2 nearest neighbor distances are calculated for each
172
+ The embeddings of these samples are then computed, and the nearest neighbor distances are calculated for each
173
173
synthetic sample to the training and holdout samples. Based on these nearest neighbor distances the following
174
174
metrics are calculated:
175
175
- Identical Match Share (IMS): The share of synthetic samples that are identical to a training or holdout sample.
@@ -205,19 +205,19 @@ class Distances(CustomBaseModel):
205
205
dcr_training : float | None = Field (
206
206
default = None ,
207
207
alias = "dcrTraining" ,
208
- description = "Average L2 nearest-neighbor distance between synthetic and training samples." ,
208
+ description = "Average nearest-neighbor distance between synthetic and training samples." ,
209
209
ge = 0.0 ,
210
210
)
211
211
dcr_holdout : float | None = Field (
212
212
default = None ,
213
213
alias = "dcrHoldout" ,
214
- description = "Average L2 nearest-neighbor distance between synthetic and holdout samples. Serves as a reference for `dcr_training`." ,
214
+ description = "Average nearest-neighbor distance between synthetic and holdout samples. Serves as a reference for `dcr_training`." ,
215
215
ge = 0.0 ,
216
216
)
217
217
dcr_trn_hol : float | None = Field (
218
218
default = None ,
219
219
alias = "dcrTrnHol" ,
220
- description = "Average L2 nearest-neighbor distance between training and holdout samples. Serves as a reference for `dcr_training`." ,
220
+ description = "Average nearest-neighbor distance between training and holdout samples. Serves as a reference for `dcr_training`." ,
221
221
ge = 0.0 ,
222
222
)
223
223
dcr_share : float | None = Field (
0 commit comments