@prefix rdf:   <http://www.w3.org/1999/02/22-rdf-syntax-ns#> .
@prefix sl:    <http://www.semanlink.net/2001/00/semanlink-schema#> .
@prefix skos:  <http://www.w3.org/2004/02/skos/core#> .
@prefix rdfs:  <http://www.w3.org/2000/01/rdf-schema#> .
@prefix tag:   <http://www.semanlink.net/tag/> .
@prefix foaf:  <http://xmlns.com/foaf/0.1/> .
@prefix dc:    <http://purl.org/dc/elements/1.1/> .

<http://www.semanlink.net/doc/2025/02/benjamin_clavie_sur_x_what_i>
        dc:title         "Benjamin Clavié sur X : \"What if a [MASK] was all you needed?...\"" ;
        sl:creationDate  "2025-02-11" ;
        sl:tag           tag:tweet , tag:modernbert , tag:benjamin_clavie .

tag:arxiv_doc  a        sl:Tag ;
        skos:prefLabel  "Arxiv Doc" .

tag:long_context  a     sl:Tag ;
        skos:prefLabel  "Long Context" .

tag:retrieval_augmented_generation
        a               sl:Tag ;
        skos:prefLabel  "RAG" .

tag:modernbert  a       sl:Tag ;
        skos:prefLabel  "ModernBERT" .

tag:tweet  a            sl:Tag ;
        skos:prefLabel  "Tweet" .

tag:colbert  a          sl:Tag ;
        skos:prefLabel  "ColBERT" .

tag:mteb  a             sl:Tag ;
        skos:prefLabel  "MTEB" .

<http://www.semanlink.net/doc/2025/07/stop_saying_rag_is_dead_hamel>
        dc:title         "Stop Saying RAG Is Dead – Hamel’s Blog" ;
        sl:comment       "> Why the future of RAG lies in better retrieval, not bigger context windows." ;
        sl:creationDate  "2025-07-14" ;
        sl:tag           tag:retrieval_augmented_generation , tag:benjamin_clavie .

tag:text_embeddings  a  sl:Tag ;
        skos:prefLabel  "Text Embeddings" .

tag:jeremy_howard  a    sl:Tag ;
        skos:prefLabel  "Jeremy Howard" .

<http://www.semanlink.net/doc/2025/01/a_little_pooling_goes_a_long_wa>
        dc:title         "A little pooling goes a long way for multi-vector representations – Answer.AI" ;
        sl:comment       "> Intuition: for documents focusing on a low number of topics, a lot of the tokens are likely to carry somewhat redundant semantic information, meaning keeping all of them is likely not useful." ;
        sl:creationDate  "2025-01-24" ;
        sl:tag           tag:colbert , tag:benjamin_clavie , tag:answer_ai .

tag:reranker  a         sl:Tag ;
        skos:prefLabel  "Reranking" .

<http://www.semanlink.net/doc/2024/01/bclavie_ragatouille>
        dc:title         "bclavie/RAGatouille" ;
        sl:comment       "> RAGatouille's purpose is to make it easy to use state-of-the-art methods in your RAG pipeline, without having to worry about the details or the years of literature! At the moment, RAGatouille focuses on making ColBERT simple to use.\r\n\r\n[Using ColBERT in-memory: Index-Free Encodings & Search](https://github.com/bclavie/RAGatouille/blob/0.0.5b1/examples/06-index_free_use.ipynb)\r\n```\r\nfrom ragatouille import RAGPretrainedModel\r\nRAG = RAGPretrainedModel.from_pretrained(\"colbert-ir/colbertv2.0\")\r\n# Your documents, a plain old list of chunked strings.\r\ndocuments = [...]\r\n# In-memory indexing supports metadata too!\r\nmeta = [{'attribute': 'really cool value'}...]\r\n# All the magic happens here\r\nRAG.encode(documents, document_metadatas=meta)\r\n# Query your in-memory index\r\nRAG.search_encoded_docs(query = \"A great question\", k=3)\r\n# All further encode() calls add to the existing documents...\r\nRAG.encode(extra_documents, document_metadatas=extra_meta)\r\n# ... until you clear them\r\nRAG.clear_encoded_docs()\r\n```" ;
        sl:creationDate  "2024-01-26" ;
        sl:tag           tag:ragatouille , tag:retrieval_augmented_generation , tag:github_project , tag:colbert , tag:benjamin_clavie .

tag:nlp_girls_and_guys
        a               sl:Tag ;
        skos:prefLabel  "NLP girls and guys" .

tag:lighton  a          sl:Tag ;
        skos:prefLabel  "Lighton" .

<http://www.semanlink.net/doc/2025/01/benjamin_clavie_sur_x_%F0%9F%A7%B5_ste>
        dc:title         "Benjamin Clavié sur X : \"Stella Embeddings: What's the big deal?...\"" ;
        sl:comment       "> Training based on unsupervised distillation\r\n\r\n> The current dominant way of training retrieval models is via the use of a contrastive loss, with little-to-no knowledge distillation\r\n> (Stella's) training work within the embedding space, seeking to minimize the geometric distances... between the teachers' vectors and the student model (Stella)'s outputs.\r\n> \r\n> Stella models (and Jasper models) generalize amazingly well because of this.\r\n" ;
        sl:creationDate  "2025-01-13" ;
        sl:tag           tag:text_embeddings , tag:mteb , tag:knowledge_distillation , tag:benjamin_clavie .

<http://www.semanlink.net/doc/2024/03/benjamin_clavie_sur_x_docume>
        dc:title         "Benjamin Clavié sur X : \"Introducing rerankers: a lightweight library to provide a unified way to use various reranking methods\"" ;
        sl:creationDate  "2024-03-16" ;
        sl:tag           tag:twitter_thread , tag:reranker , tag:benjamin_clavie .

<http://www.semanlink.net/doc/2024/12/jeremy_howard_sur_x_i_ll_get>
        dc:title         "Jeremy Howard sur X : \"We trained 2 new models. Like BERT, but modern. ModernBERT. Not some hypey GenAI thing, but a proper workhorse model, for retrieval, classification, etc...\"" ;
        sl:comment       "<https://x.com/LightOnIO/status/1869785737832366306>" ;
        sl:creationDate  "2024-12-21" ;
        sl:tag           tag:twitter_thread , tag:modernbert , tag:lighton , tag:jeremy_howard , tag:benjamin_clavie .

<http://www.semanlink.net/doc/2024/12/2412_13663_smarter_better_f>
        dc:title         "[2412.13663] Smarter, Better, Faster, Longer: A Modern Bidirectional Encoder for Fast, Memory Efficient, and Long Context Finetuning and Inference" ;
        sl:creationDate  "2024-12-21" ;
        sl:tag           tag:modernbert , tag:long_context , tag:jeremy_howard , tag:benjamin_clavie , tag:arxiv_doc .

tag:answer_ai  a        sl:Tag ;
        skos:prefLabel  "Answer.AI" .

tag:ragatouille  a      sl:Tag ;
        skos:prefLabel  "RAGatouille" .

tag:benjamin_clavie  a    sl:Tag ;
        rdfs:isDefinedBy  tag:benjamin_clavie.n3 ;
        sl:comment        "@bclavie" ;
        skos:broader      tag:nlp_girls_and_guys ;
        skos:prefLabel    "Benjamin Clavié" ;
        skos:related      tag:ragatouille , tag:answer_ai ;
        foaf:page         tag:benjamin_clavie.html .

tag:github_project  a   sl:Tag ;
        skos:prefLabel  "GitHub project" .

tag:knowledge_distillation
        a               sl:Tag ;
        skos:prefLabel  "Knowledge distillation" .

tag:twitter_thread  a   sl:Tag ;
        skos:prefLabel  "Twitter thread" .
