@prefix this: <https://w3id.org/np/RA6amI79BFW1axJuNM0PmqefGYO-SWR72EoGG5fb0KuB0> .
@prefix sub: <https://w3id.org/np/RA6amI79BFW1axJuNM0PmqefGYO-SWR72EoGG5fb0KuB0#> .
@prefix rdfs: <http://www.w3.org/2000/01/rdf-schema#> .
@prefix xsd: <http://www.w3.org/2001/XMLSchema#> .
@prefix np: <http://www.nanopub.org/nschema#> .
@prefix npx: <http://purl.org/nanopub/x/> .
@prefix dcterms: <http://purl.org/dc/terms/> .
@prefix prov: <http://www.w3.org/ns/prov#> .
@prefix schema: <https://schema.org/> .
@prefix foaf: <http://xmlns.com/foaf/0.1/> .
# Head graph: declares `this:` to be a nanopublication and points to the three
# named graphs (assertion, provenance, publication info) that make it up.
sub:head {
  this: np:hasAssertion sub:assertion ;
    np:hasProvenance sub:provenance ;
    np:hasPublicationInfo sub:pubinfo ;
    a np:Nanopublication .
}
# Assertion graph: the content of the post. It describes one referenced
# resource and attaches the post text, keywords, and citation-style links to
# the assertion graph itself (sub:assertion is used as a subject below).
#
# NOTE(review): the referenced resource's host is spelled "arvix.org" in every
# IRI here and inside the rdfs:comment literal. This looks like a typo for
# "arxiv.org" — confirm against the original post. Do not correct it in place:
# these triples are covered by the signature in sub:pubinfo, so any change
# would presumably invalidate it; a corrected nanopublication would need to be
# re-signed and re-published.
sub:assertion {
  # Reference-manager item type recorded for the linked resource.
  <https://arvix.org/abs/2207.15796> <https://sense-nets.xyz/hasZoteroItemType> "webpage" .
  # Author of the assertion, followed by the relations between the post and the resource.
  sub:assertion dcterms:creator <https://w3id.org/np/RA8InlmUPoZ6CTtHP_RkqFBHJSnasnRcjI3qz7EJ-nHJY> ;
    <http://purl.org/spar/cito/discusses> <https://arvix.org/abs/2207.15796> ;
    <http://purl.org/spar/cito/linksTo> <https://arvix.org/abs/2207.15796> ;
    # Post text as a long (triple-quoted) literal. The leading space, the blank
    # lines, and the trailing newlines are all part of the literal value.
    rdfs:comment """ New paper alert! 🚨 We've been exploring the impact of context on LLM performance evaluation. Turns out, evaluating models on individual examples might not tell the whole story. #MachineLearning #AI

Our findings suggest that batch evaluation allows models to identify patterns and tendencies, leading to more nuanced assessments. Plus, a two-step decision process (analysis + scoring) shows promising results. Exciting times for ML eval! 📊🧠

To learn more, check out the paper: https://arvix.org/abs/2207.15796

""" ;
    # One plain-literal keyword per value.
    schema:keywords "AI" , "LLM" , "MachineLearning" , "batch-evaluation" , "performance-evaluation" , "two-step-decision-process" ;
    <https://sense-nets.xyz/announcesResource> <https://arvix.org/abs/2207.15796> .
}
# Provenance graph: records how the assertion came to be — the software agent
# involved, the activity that generated it, the source post, and the person it
# is attributed to.
sub:provenance {
  # The sense-nets service is a software agent acting on behalf of the author.
  <https://sense-nets.xyz/> a prov:SoftwareAgent ;
    prov:actedOnBehalfOf <https://w3id.org/np/RA8InlmUPoZ6CTtHP_RkqFBHJSnasnRcjI3qz7EJ-nHJY> .
  # The generating activity, associated with that software agent.
  sub:activity a <https://sense-nets.xyz/supervisedActivity> ;
    prov:wasAssociatedWith <https://sense-nets.xyz/> .
  # NOTE(review): `prov:linksTo` does not appear to be a term defined by PROV-O
  # (the assertion graph uses cito:linksTo) — verify the intended predicate.
  # NOTE(review): `prov:wasAssociatedWith` is normally stated about an activity;
  # here its subject is the assertion graph — confirm this is intentional.
  # Neither can be changed without re-signing (see npx:hasSignature in sub:pubinfo).
  sub:assertion prov:linksTo <https://x.com/sensenets_demo/status/1839674524729483541> ;
    prov:wasAssociatedWith <https://x.com/sensenets_demo> ;
    prov:wasAttributedTo <https://w3id.org/np/RA8InlmUPoZ6CTtHP_RkqFBHJSnasnRcjI3qz7EJ-nHJY> ;
    prov:wasGeneratedBy sub:activity .
  # Links the author's identifier to their account on x.com.
  <https://w3id.org/np/RA8InlmUPoZ6CTtHP_RkqFBHJSnasnRcjI3qz7EJ-nHJY> foaf:account <https://x.com/sensenets_demo> .
}
# Publication-info graph: metadata about the nanopublication itself — its
# digital signature, creation time, creator, license, type, and label.
sub:pubinfo {
  # Signature element: algorithm, public key, and signature value (the key and
  # signature look base64-encoded), targeting the whole nanopublication (`this:`).
  sub:sig npx:hasAlgorithm "RSA" ;
    npx:hasPublicKey "MIIBIjANBgkqhkiG9w0BAQEFAAOCAQ8AMIIBCgKCAQEArHtI92jm8pAYVsvJabxLGfOT+7G0JyJGh2gwjB5x2pFPga6wWTd+rNBWWUZViIFnaJrBEsJpgdnoupLU9ppwn+khMiGRfxqGsDDzwHcj3Jc75CRys7d3etwXdBdoXfBgjsJiZBazwm13idr6tljRrC1TaEJBnRQAqzBw9cLDeGY77cSznzXT39feUGT168dpCSE9O6u/48DvvWVqciHGsH9cQ+LroJJVsMrorwtsdZnAK+q48wtIP6pIpw5shSJ5LnA0qeN/f4TvTFDV6ItYIXjiWWpTECc/Bxmfnyat3B5xWCu9nvz8fEs7Ns0TuzQwT3/K55iSKDEIi/E0nO97xwIDAQAB" ;
    npx:hasSignature "UfNKMSMxjJF6FmekyAFM3JrDGaiwLMq8OK0b3TsssKDHOlONBvYOzIWsO+Q5sDE3EGKMNcf0L9RvIgAwkaOJd4jgM4DgISHMEE7mOdJJ8+ogj3qea5jjPDXjwPAaUC1v51Hzc7v40LKALWGD3uJEyorHVpAL1z8FO9DlrLbu9sYzQ9zUHxvnRl0fJKGXkzzT1Z5ODlEs5c5/oq2L8LtKlDg5NSW/o2+5ELcKUDXF9cB2qGy8mymmlFXId4D4Q2BuE52/YtOLdRCJQhiEJaC9ZEw8NBUmDILw3NmKj7kOaU9BZzhQkWfc415rNBJSbXxwj6uM5JQIxTX6zUcwTEa9Sw==" ;
    npx:hasSignatureTarget this: ;
    # NOTE(review): `npx:singedBy` looks like a misspelling of `npx:signedBy`;
    # consumers looking for the signer under the correctly spelled predicate
    # would not find this triple. Fixing it requires re-signing — confirm with
    # the producing tool.
    npx:singedBy <https://sense-nets.xyz/> ;
    # NOTE(review): this IRI appears to be the author IRI with
    # "signingDelegation" appended without a separator (no "#" or "/") —
    # presumably unintended; verify.
    prov:wasAssociatedWith <https://w3id.org/np/RA8InlmUPoZ6CTtHP_RkqFBHJSnasnRcjI3qz7EJ-nHJYsigningDelegation> .
  # Metadata about the nanopublication as a whole.
  this: dcterms:created "2024-09-27T15:38:26.351Z"^^xsd:dateTime ;
    dcterms:creator <https://w3id.org/np/RA8InlmUPoZ6CTtHP_RkqFBHJSnasnRcjI3qz7EJ-nHJY> ;
    dcterms:license <https://creativecommons.org/licenses/by/4.0/> ;
    npx:hasNanopubType <https://sense-nets.xyz/SemanticPost> ;
    npx:wasCreatedAt <https://sense-nets.xyz/> ;
    rdfs:label "CoSMO Semantic Post" ;
    # Root signer recorded as a plain string literal (looks like a hex account
    # address — TODO confirm its format and meaning with the producer).
    <https://sense-nets.xyz/hasRootSigner> "0x5b9967FC42C160f6146d5ea1f0d08E88370f370b" .
  # Human-readable name of the creator.
  <https://w3id.org/np/RA8InlmUPoZ6CTtHP_RkqFBHJSnasnRcjI3qz7EJ-nHJY> foaf:name "Quinn Zhang, PhD" .
}