@prefix this: <https://w3id.org/kpxl/ios/ds/np/RAn08NC9isAMOUJCNaGrh31KHTSet2xemhzqS9YNB49hQ> .
@prefix sub: <https://w3id.org/kpxl/ios/ds/np/RAn08NC9isAMOUJCNaGrh31KHTSet2xemhzqS9YNB49hQ#> .
@prefix np: <http://www.nanopub.org/nschema#> .
@prefix dct: <http://purl.org/dc/terms/> .
@prefix rdf: <http://www.w3.org/1999/02/22-rdf-syntax-ns#> .
@prefix nt: <https://w3id.org/np/o/ntemplate/> .
@prefix npx: <http://purl.org/nanopub/x/> .
@prefix xsd: <http://www.w3.org/2001/XMLSchema#> .
@prefix rdfs: <http://www.w3.org/2000/01/rdf-schema#> .
@prefix orcid: <https://orcid.org/> .
@prefix ns1: <http://purl.org/np/> .
@prefix prov: <http://www.w3.org/ns/prov#> .
@prefix foaf: <http://xmlns.com/foaf/0.1/> .
# Head graph: declares this resource as a nanopublication and points to its
# three content graphs (assertion, provenance, publication info).
sub:Head {
  this: np:hasAssertion sub:assertion ;
    np:hasProvenance sub:provenance ;
    np:hasPublicationInfo sub:pubinfo ;
    a np:Nanopublication .
}
# Assertion graph: bibliographic metadata for the article identified by
# https://doi.org/10.3233/DS-240059, its journal, its authors and their affiliations.
sub:assertion {
  # The journal, identified by its ISSN IRI.
  <http://id.crossref.org/issn/2451-8492> dct:title "Data Science" .
  # The article: abstract, date, a linked part, containing journal, title and type.
  <https://doi.org/10.3233/DS-240059> dct:abstract "Measuring data drift is essential in machine learning applications where model scoring (evaluation) is done on data samples that differ from those used in training. The Kullback-Leibler divergence is a common measure of shifted probability distributions, for which discretized versions are invented to deal with binned or categorical data. We present the Unstable Population Indicator, a robust, flexible and numerically stable, discretized implementation of Jeffrey's divergence, along with an implementation in a Python package that can deal with continuous, discrete, ordinal and nominal data in a variety of popular data types. We show the numerical and statistical properties in controlled experiments. It is not advised to employ a common cut-off to distinguish stable from unstable populations, but rather to let that cut-off depend on the use case." ;
    dct:date "2024-06-26" ;
    dct:hasPart <https://w3id.org/kpxl/ios/ds/np/RA0XRooQKz2A7aoP0VJLS2NKcvQv-n7RwPoYtcD4wtTPc> ;
    dct:isPartOf <http://id.crossref.org/issn/2451-8492> ;
    dct:title "Measuring Data Drift with the Unstable Population Indicator" ;
    a <http://purl.org/spar/fabio/ResourcePaper> .
  # Authors, identified by ORCID: affiliations (ror.org IRIs), e-mail and name.
  orcid:0000-0003-2581-8370 <http://schema.org/affiliation> <https://ror.org/04dkp9463> , <https://ror.org/05xvt9f17> ;
    <http://schema.org/email> "datascience@marcelhaas.com" ;
    foaf:name "Marcel R. Haas" .
  orcid:0009-0003-5030-0108 <http://schema.org/affiliation> <https://ror.org/04b8v1s79> , <https://ror.org/04dkp9463> ;
    <http://schema.org/email> "L.Sibbald@tilburguniversity.edu" ;
    foaf:name "Lisette Sibbald" .
  # Display names for the affiliation IRIs referenced above.
  <https://ror.org/04b8v1s79> foaf:name "Department of Methodology and Statistics and Department of Cognitive Neuropsychology, Tilburg University, Prof. Cobbenhagenlaan 125, 5037 DB Tilburg, The Netherlands" .
  <https://ror.org/04dkp9463> foaf:name "Business Intelligence, University of Amsterdam, Spui 21, 1012WX Amsterdam, The Netherlands" .
  <https://ror.org/05xvt9f17> foaf:name "Public Health and Primary Care, Leiden University Medical Center, Albinusdreef 2, The Netherlands" .
  # Ordered author list entries (rdf:_1, rdf:_2).
  # NOTE(review): the second entry is attached to sub:author-list__1 rather than
  # sub:author-list, whereas the pubinfo graph puts both rdf:_1 and rdf:_2 on
  # sub:author-list. This looks like a generation artifact that splits the list
  # across two resources -- confirm. Do not patch in place: changing a triple
  # would presumably invalidate the signature recorded in the pubinfo graph;
  # publish a corrected nanopublication that supersedes this one instead.
  sub:author-list rdf:_1 orcid:0000-0003-2581-8370 .
  sub:author-list__1 rdf:_2 orcid:0009-0003-5030-0108 .
}
# Provenance graph: attributes the assertion graph to the two ORCID-identified
# authors described in the assertion.
sub:provenance {
  sub:assertion prov:wasAttributedTo orcid:0000-0003-2581-8370 , orcid:0009-0003-5030-0108 .
}
# Publication-info graph: metadata about the nanopublication itself (creator,
# timestamp, license, signature, templates), as opposed to the article it describes.
sub:pubinfo {
  # Human-readable names for the ORCID IRIs used in this nanopublication.
  orcid:0000-0002-1267-0234 foaf:name "Tobias Kuhn" .
  orcid:0000-0003-2581-8370 foaf:name "Marcel R. Haas" .
  orcid:0009-0003-5030-0108 foaf:name "Lisette Sibbald" .
  # Ordered author list, referenced below via bibo:authorList.
  sub:author-list rdf:_1 orcid:0000-0003-2581-8370 ;
    rdf:_2 orcid:0009-0003-5030-0108 .
  # Digital signature record: algorithm, public key, signature value, the
  # resource the signature targets (this nanopublication) and the signer.
  # The key and signature literals must be kept byte-for-byte.
  sub:sig npx:hasAlgorithm "RSA" ;
    npx:hasPublicKey "MIGfMA0GCSqGSIb3DQEBAQUAA4GNADCBiQKBgQCjDGQCS1S+SRnERDuYDXOugdYUP0efEquHJEEHAbU/uLzBVlga89zqrNPCS7fBE6lArBUWEmT8eLKdMapyqvAzI1J3jUWTMhDJF+XFBkUiuiFfNSc4vJJcmi0yujtnuzXsRIG202jyaP4f5ULoskFwaZOSBZJfiE0dsB3D7DTIAQIDAQAB" ;
    npx:hasSignature "Ox+5X6nHLumNtHd4Ka2ICEWhUX+v6KVWn4UKDEEAixySaGj9TJt/mBFpssxtxcrM29g070GCs1SakxQ2Re3c6lUEEkHh/E4MLDc9ReR2vZoLi2oUzJfKzWC+WuTjML12q88gZUw9uoWThRpPW+j4XOn8dUrPk8DffrF/R1+Hrg8=" ;
    npx:hasSignatureTarget this: ;
    npx:signedBy orcid:0000-0002-1267-0234 .
  # Statements about the nanopublication: creation time and creator, the
  # article it belongs to and introduces, its license and types, the earlier
  # nanopublication it supersedes, the site it was created at, its author
  # list and label, and the templates it was created from.
  this: dct:created "2024-07-12T09:07:29.273Z"^^xsd:dateTime ;
    dct:creator orcid:0000-0002-1267-0234 ;
    dct:isPartOf <https://doi.org/10.3233/DS-240059> ;
    dct:license <https://creativecommons.org/licenses/by/4.0/> ;
    npx:hasNanopubType <http://purl.org/spar/fabio/ScholarlyWork> , <https://w3id.org/kpxl/ios/ds/terms/DataScienceNanopub> ;
    npx:introduces <https://doi.org/10.3233/DS-240059> ;
    npx:supersedes <https://w3id.org/kpxl/ios/ds/np/RALO1noJ6z4w0bumoQuKpUVKT7HE_zagqAA8Qy4djeLg0> ;
    npx:wasCreatedAt <https://nanodash.petapico.org/> ;
    <http://purl.org/ontology/bibo/authorList> sub:author-list ;
    rdfs:label "Article: Measuring Data Drift with the Unstable Population Indicator" ;
    nt:wasCreatedFromProvenanceTemplate ns1:RAi6zZAwhaJ23Hzg4lIjlPir6Take3ZQp-lS9skfBEwfQ ;
    nt:wasCreatedFromPubinfoTemplate ns1:RAA2MfqdBCzmz9yVWjKLXNbyfBNcwsMmOqcNUxkk1maIM , ns1:RAh1gm83JiG5M6kDxXhaYT1l49nCzyrckMvTzcPn-iv90 , ns1:RAjpBMlw3owYhJUBo3DtsuDlXsNAJ8cnGeWAutDVjuAuI , <https://w3id.org/np/RA5R_qv3VsZIrDKd8Mr37x3HoKCsKkwN5tJVqgQsKhjTE> , <https://w3id.org/np/RAIabr2sRVJ-YOIwZRD__BVMJKnq3QtQw_mjLIGSACPAI> , <https://w3id.org/np/RA_JdI7pfDcyvEXLr_gper3h8egmNggeTqkJbyHrlMEdo> , <https://w3id.org/np/RAoWx0AJvNw-WqkGgZO4k8udNCg6kMcGZARN3DgO_5TII> ;
    nt:wasCreatedFromTemplate <https://w3id.org/np/RAeQJfX3lMDqtzyddnRmlBvxSoWohzEKzsaMKWrR8K6J0> .
}