https://w3id.org/np/RA6amI79BFW1axJuNM0PmqefGYO-SWR72EoGG5fb0KuB0
.trig | .trig.txt | .jelly | .jelly.txt
@prefix this: <https://w3id.org/np/RA6amI79BFW1axJuNM0PmqefGYO-SWR72EoGG5fb0KuB0> . @prefix sub: <https://w3id.org/np/RA6amI79BFW1axJuNM0PmqefGYO-SWR72EoGG5fb0KuB0#> . @prefix rdfs: <http://www.w3.org/2000/01/rdf-schema#> . @prefix xsd: <http://www.w3.org/2001/XMLSchema#> . @prefix np: <http://www.nanopub.org/nschema#> . @prefix npx: <http://purl.org/nanopub/x/> . @prefix dcterms: <http://purl.org/dc/terms/> . @prefix prov: <http://www.w3.org/ns/prov#> . @prefix schema: <https://schema.org/> . @prefix foaf: <http://xmlns.com/foaf/0.1/> . sub:head { this: a np:Nanopublication; np:hasAssertion sub:assertion; np:hasProvenance sub:provenance; np:hasPublicationInfo sub:pubinfo . } sub:assertion { <https://arvix.org/abs/2207.15796> <https://sense-nets.xyz/hasZoteroItemType> "webpage" . sub:assertion dcterms:creator <https://w3id.org/np/RA8InlmUPoZ6CTtHP_RkqFBHJSnasnRcjI3qz7EJ-nHJY>; <http://purl.org/spar/cito/discusses> <https://arvix.org/abs/2207.15796>; <http://purl.org/spar/cito/linksTo> <https://arvix.org/abs/2207.15796>; rdfs:comment """ New paper alert! We've been exploring the impact of context on LLM performance evaluation. Turns out, evaluating models on individual examples might not tell the whole story. #MachineLearning #AI Our findings suggest that batch evaluation allows models to identify patterns and tendencies, leading to more nuanced assessments. Plus, a two-step decision process (analysis + scoring) shows promising results. Exciting times for ML eval! To learn more, check out the paper: https://arvix.org/abs/2207.15796 """; schema:keywords "AI", "LLM", "MachineLearning", "batch-evaluation", "performance-evaluation", "two-step-decision-process"; <https://sense-nets.xyz/announcesResource> <https://arvix.org/abs/2207.15796> . } sub:provenance { <https://sense-nets.xyz/> a prov:SoftwareAgent; prov:actedOnBehalfOf <https://w3id.org/np/RA8InlmUPoZ6CTtHP_RkqFBHJSnasnRcjI3qz7EJ-nHJY> . sub:activity a <https://sense-nets.xyz/supervisedActivity>; prov:wasAssociatedWith <https://sense-nets.xyz/> . sub:assertion prov:linksTo <https://x.com/sensenets_demo/status/1839674524729483541>; prov:wasAssociatedWith <https://x.com/sensenets_demo>; prov:wasAttributedTo <https://w3id.org/np/RA8InlmUPoZ6CTtHP_RkqFBHJSnasnRcjI3qz7EJ-nHJY>; prov:wasGeneratedBy sub:activity . <https://w3id.org/np/RA8InlmUPoZ6CTtHP_RkqFBHJSnasnRcjI3qz7EJ-nHJY> foaf:account <https://x.com/sensenets_demo> . } sub:pubinfo { sub:sig npx:hasAlgorithm "RSA"; npx:hasPublicKey "MIIBIjANBgkqhkiG9w0BAQEFAAOCAQ8AMIIBCgKCAQEArHtI92jm8pAYVsvJabxLGfOT+7G0JyJGh2gwjB5x2pFPga6wWTd+rNBWWUZViIFnaJrBEsJpgdnoupLU9ppwn+khMiGRfxqGsDDzwHcj3Jc75CRys7d3etwXdBdoXfBgjsJiZBazwm13idr6tljRrC1TaEJBnRQAqzBw9cLDeGY77cSznzXT39feUGT168dpCSE9O6u/48DvvWVqciHGsH9cQ+LroJJVsMrorwtsdZnAK+q48wtIP6pIpw5shSJ5LnA0qeN/f4TvTFDV6ItYIXjiWWpTECc/Bxmfnyat3B5xWCu9nvz8fEs7Ns0TuzQwT3/K55iSKDEIi/E0nO97xwIDAQAB"; npx:hasSignature "UfNKMSMxjJF6FmekyAFM3JrDGaiwLMq8OK0b3TsssKDHOlONBvYOzIWsO+Q5sDE3EGKMNcf0L9RvIgAwkaOJd4jgM4DgISHMEE7mOdJJ8+ogj3qea5jjPDXjwPAaUC1v51Hzc7v40LKALWGD3uJEyorHVpAL1z8FO9DlrLbu9sYzQ9zUHxvnRl0fJKGXkzzT1Z5ODlEs5c5/oq2L8LtKlDg5NSW/o2+5ELcKUDXF9cB2qGy8mymmlFXId4D4Q2BuE52/YtOLdRCJQhiEJaC9ZEw8NBUmDILw3NmKj7kOaU9BZzhQkWfc415rNBJSbXxwj6uM5JQIxTX6zUcwTEa9Sw=="; npx:hasSignatureTarget this:; npx:singedBy <https://sense-nets.xyz/>; prov:wasAssociatedWith <https://w3id.org/np/RA8InlmUPoZ6CTtHP_RkqFBHJSnasnRcjI3qz7EJ-nHJYsigningDelegation> . this: dcterms:created "2024-09-27T15:38:26.351Z"^^xsd:dateTime; dcterms:creator <https://w3id.org/np/RA8InlmUPoZ6CTtHP_RkqFBHJSnasnRcjI3qz7EJ-nHJY>; dcterms:license <https://creativecommons.org/licenses/by/4.0/>; npx:hasNanopubType <https://sense-nets.xyz/SemanticPost>; npx:wasCreatedAt <https://sense-nets.xyz/>; rdfs:label "CoSMO Semantic Post"; <https://sense-nets.xyz/hasRootSigner> "0x5b9967FC42C160f6146d5ea1f0d08E88370f370b" . <https://w3id.org/np/RA8InlmUPoZ6CTtHP_RkqFBHJSnasnRcjI3qz7EJ-nHJY> foaf:name "Quinn Zhang, PhD" . }